cow_http_hd.erl 124 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327732783279328032813282328332843285328632873288328932903291329232933294329532963297329832993300330133023303330433053306330733083309331033113312331333143315331633173318331933203321332233233324332533263327332833293330333133323333333433353336333733383339334033413342334333443345334633473348334933503351335233533354335533563357335833593360336133623363336433653366336733683369337033713372337333743375337633773378337933803381338233833384338533863387338833893390339133923393339433953396339733983399
  1. %% Copyright (c) 2014-2015, Loïc Hoguin <essen@ninenines.eu>
  2. %%
  3. %% Permission to use, copy, modify, and/or distribute this software for any
  4. %% purpose with or without fee is hereby granted, provided that the above
  5. %% copyright notice and this permission notice appear in all copies.
  6. %%
  7. %% THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
  8. %% WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
  9. %% MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
  10. %% ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
  11. %% WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
  12. %% ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
  13. %% OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
  14. -module(cow_http_hd).
  15. %% Parsing.
  16. -export([parse_accept/1]).
  17. -export([parse_accept_charset/1]).
  18. % @todo -export([parse_accept_datetime/1]). RFC7089
  19. -export([parse_accept_encoding/1]).
  20. % @todo -export([parse_accept_features/1]). RFC2295
  21. -export([parse_accept_language/1]).
  22. -export([parse_accept_ranges/1]).
  23. % @todo -export([parse_access_control_allow_credentials/1]). CORS
  24. % @todo -export([parse_access_control_allow_headers/1]). CORS
  25. % @todo -export([parse_access_control_allow_methods/1]). CORS
  26. % @todo -export([parse_access_control_allow_origin/1]). CORS
  27. % @todo -export([parse_access_control_expose_headers/1]). CORS
  28. % @todo -export([parse_access_control_max_age/1]). CORS
  29. -export([parse_access_control_request_headers/1]).
  30. -export([parse_access_control_request_method/1]).
  31. -export([parse_age/1]).
  32. -export([parse_allow/1]).
  33. % @todo -export([parse_alternates/1]). RFC2295
  34. % @todo -export([parse_authentication_info/1]). RFC2617
  35. -export([parse_authorization/1]).
  36. -export([parse_cache_control/1]).
  37. -export([parse_connection/1]).
  38. % @todo -export([parse_content_disposition/1]). RFC6266
  39. -export([parse_content_encoding/1]).
  40. -export([parse_content_language/1]).
  41. -export([parse_content_length/1]).
  42. % @todo -export([parse_content_location/1]). RFC7231
  43. % @todo -export([parse_content_md5/1]). RFC2616 (deprecated)
  44. -export([parse_content_range/1]).
  45. % @todo -export([parse_content_security_policy/1]). CSP
  46. % @todo -export([parse_content_security_policy_report_only/1]). CSP
  47. -export([parse_content_type/1]).
  48. % @todo -export([parse_cookie/1]). RFC6265
  49. -export([parse_date/1]).
  50. % @todo -export([parse_digest/1]). RFC3230
  51. % @todo -export([parse_dnt/1]). http://donottrack.us/
  52. -export([parse_etag/1]).
  53. -export([parse_expect/1]).
  54. -export([parse_expires/1]).
  55. % @todo -export([parse_forwarded/1]). RFC7239
  56. % @todo -export([parse_from/1]). RFC7231
  57. -export([parse_host/1]).
  58. -export([parse_http2_settings/1]).
  59. -export([parse_if_match/1]).
  60. -export([parse_if_modified_since/1]).
  61. -export([parse_if_none_match/1]).
  62. -export([parse_if_range/1]).
  63. -export([parse_if_unmodified_since/1]).
  64. % @todo -export([parse_last_event_id/1]). eventsource
  65. -export([parse_last_modified/1]).
  66. % @todo -export([parse_link/1]). RFC5988
  67. % @todo -export([parse_location/1]). RFC7231
  68. -export([parse_max_forwards/1]).
  69. % @todo -export([parse_memento_datetime/1]). RFC7089
  70. % @todo -export([parse_negotiate/1]). RFC2295
  71. -export([parse_origin/1]).
  72. -export([parse_pragma/1]).
  73. % @todo -export([parse_prefer/1]). RFC7240
  74. -export([parse_proxy_authenticate/1]).
  75. % @todo -export([parse_proxy_authentication_info/1]). RFC2617
  76. -export([parse_proxy_authorization/1]).
  77. % @todo -export([parse_proxy_support/1]). RFC4559
  78. % @todo -export([parse_public_key_pins/1]). Key Pinning (upcoming)
  79. % @todo -export([parse_public_key_pins_report_only/1]). Key Pinning (upcoming)
  80. -export([parse_range/1]).
  81. % @todo -export([parse_referer/1]). RFC7231
  82. % @todo -export([parse_refresh/1]). Non-standard (examples: "5", "5; url=http://example.com/")
  83. -export([parse_retry_after/1]).
  84. -export([parse_sec_websocket_accept/1]).
  85. -export([parse_sec_websocket_extensions/1]).
  86. -export([parse_sec_websocket_key/1]).
  87. % @todo -export([parse_sec_websocket_origin/1]). Websocket drafts 7 and 8
  88. -export([parse_sec_websocket_protocol_req/1]).
  89. -export([parse_sec_websocket_protocol_resp/1]).
  90. -export([parse_sec_websocket_version_req/1]).
  91. -export([parse_sec_websocket_version_resp/1]).
  92. % @todo -export([parse_server/1]). RFC7231
  93. % @todo -export([parse_set_cookie/1]). RFC6265
  94. % @todo -export([parse_strict_transport_security/1]). RFC6797
  95. % @todo -export([parse_tcn/1]). RFC2295
  96. -export([parse_te/1]).
  97. -export([parse_trailer/1]).
  98. -export([parse_transfer_encoding/1]).
  99. -export([parse_upgrade/1]).
  100. % @todo -export([parse_user_agent/1]). RFC7231
  101. % @todo -export([parse_variant_vary/1]). RFC2295
  102. -export([parse_vary/1]).
  103. % @todo -export([parse_via/1]). RFC7230
  104. % @todo -export([parse_want_digest/1]). RFC3230
  105. % @todo -export([parse_warning/1]). RFC7234
  106. -export([parse_www_authenticate/1]).
  107. % @todo -export([parse_x_content_duration/1]). Gecko/MDN (value: float)
  108. % @todo -export([parse_x_dns_prefetch_control/1]). Various (value: "on"|"off")
  109. -export([parse_x_forwarded_for/1]).
  110. % @todo -export([parse_x_frame_options/1]). RFC7034
  111. %% Building.
  112. -export([access_control_allow_credentials/0]).
  113. -export([access_control_allow_headers/1]).
  114. -export([access_control_allow_methods/1]).
  115. -export([access_control_allow_origin/1]).
  116. -export([access_control_expose_headers/1]).
  117. -export([access_control_max_age/1]).
  118. -type etag() :: {weak | strong, binary()}.
  119. -export_type([etag/0]).
  120. -type media_type() :: {binary(), binary(), [{binary(), binary()}]}.
  121. -export_type([media_type/0]).
  122. -type qvalue() :: 0..1000.
  123. -export_type([qvalue/0]).
  124. -type websocket_version() :: 0..255.
  125. -export_type([websocket_version/0]).
  126. -include("cow_inline.hrl").
  127. -include("cow_parse.hrl").
  128. -ifdef(TEST).
  129. -include_lib("triq/include/triq.hrl").
  130. vector(Min, Max, Dom) -> ?LET(N, choose(Min, Max), vector(N, Dom)).
  131. small_list(Dom) -> vector(0, 10, Dom).
  132. small_non_empty_list(Dom) -> vector(1, 10, Dom).
  133. alpha_chars() -> "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ".
  134. alphanum_chars() -> "0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ".
  135. digit_chars() -> "0123456789".
  136. ows() -> list(elements([$\s, $\t])).
  137. alpha() -> elements(alpha_chars()).
  138. alphanum() -> elements(alphanum_chars()).
  139. digit() -> elements(digit_chars()).
  140. tchar() ->
  141. frequency([
  142. {1, elements([$!, $#, $$, $%, $&, $', $*, $+, $-, $., $^, $_, $`, $|, $~])},
  143. {99, elements(alphanum_chars())}
  144. ]).
  145. token() ->
  146. ?LET(T,
  147. non_empty(list(tchar())),
  148. list_to_binary(T)).
  149. abnf_char() ->
  150. int(1, 127).
  151. vchar() ->
  152. int(33, 126).
  153. obs_text() ->
  154. int(128, 255).
  155. qdtext() ->
  156. frequency([
  157. {99, elements("\t\s!#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[]^_`abcdefghijklmnopqrstuvwxyz{|}~")},
  158. {1, obs_text()}
  159. ]).
  160. quoted_pair() ->
  161. [$\\, frequency([
  162. {99, elements("\t\s!\"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\\]^_`abcdefghijklmnopqrstuvwxyz{|}~")},
  163. {1, obs_text()}
  164. ])].
  165. quoted_string() ->
  166. [$", list(frequency([{100, qdtext()}, {1, quoted_pair()}])), $"].
  167. %% Helper function for ( token / quoted-string ) values.
  168. unquote([$", V, $"]) -> unquote(V, <<>>);
  169. unquote(V) -> V.
  170. unquote([], Acc) -> Acc;
  171. unquote([[$\\, C]|Tail], Acc) -> unquote(Tail, << Acc/binary, C >>);
  172. unquote([C|Tail], Acc) -> unquote(Tail, << Acc/binary, C >>).
  173. parameter() ->
  174. ?SUCHTHAT({K, _, _, _},
  175. {token(), oneof([token(), quoted_string()]), ows(), ows()},
  176. K =/= <<"q">>).
  177. weight() ->
  178. frequency([
  179. {90, int(0, 1000)},
  180. {10, undefined}
  181. ]).
  182. %% Helper function for weight's qvalue formatting.
  183. qvalue_to_iodata(0) -> <<"0">>;
  184. qvalue_to_iodata(Q) when Q < 10 -> [<<"0.00">>, integer_to_binary(Q)];
  185. qvalue_to_iodata(Q) when Q < 100 -> [<<"0.0">>, integer_to_binary(Q)];
  186. qvalue_to_iodata(Q) when Q < 1000 -> [<<"0.">>, integer_to_binary(Q)];
  187. qvalue_to_iodata(1000) -> <<"1">>.
  188. -endif.
  189. %% Parsing.
  190. %% @doc Parse the Accept header.
  191. -spec parse_accept(binary()) -> [{media_type(), qvalue(), [binary() | {binary(), binary()}]}].
  192. parse_accept(<<"*/*">>) ->
  193. [{{<<"*">>, <<"*">>, []}, 1000, []}];
  194. parse_accept(Accept) ->
  195. media_range_list(Accept, []).
  196. media_range_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) -> ?LOWER(media_range_type, R, Acc, <<>>);
  197. media_range_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> media_range_list(R, Acc);
  198. media_range_list(<<>>, Acc) -> lists:reverse(Acc).
  199. media_range_type(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) -> ?LOWER(media_range_type, R, Acc, T);
  200. media_range_type(<< $/, C, R/bits >>, Acc, T) when ?IS_TOKEN(C) -> ?LOWER(media_range_subtype, R, Acc, T, <<>>);
  201. %% Special clause for badly behaving user agents that send * instead of */*.
  202. media_range_type(<< $;, R/bits >>, Acc, <<"*">>) -> media_range_before_param(R, Acc, <<"*">>, <<"*">>, []).
  203. media_range_subtype(<< C, R/bits >>, Acc, T, S) when ?IS_TOKEN(C) -> ?LOWER(media_range_subtype, R, Acc, T, S);
  204. media_range_subtype(R, Acc, T, S) -> media_range_param_sep(R, Acc, T, S, []).
  205. media_range_param_sep(<<>>, Acc, T, S, P) -> lists:reverse([{{T, S, lists:reverse(P)}, 1000, []}|Acc]);
  206. media_range_param_sep(<< $,, R/bits >>, Acc, T, S, P) -> media_range_list(R, [{{T, S, lists:reverse(P)}, 1000, []}|Acc]);
  207. media_range_param_sep(<< $;, R/bits >>, Acc, T, S, P) -> media_range_before_param(R, Acc, T, S, P);
  208. media_range_param_sep(<< C, R/bits >>, Acc, T, S, P) when ?IS_WS(C) -> media_range_param_sep(R, Acc, T, S, P).
  209. media_range_before_param(<< C, R/bits >>, Acc, T, S, P) when ?IS_WS(C) -> media_range_before_param(R, Acc, T, S, P);
  210. media_range_before_param(<< $q, $=, R/bits >>, Acc, T, S, P) -> media_range_weight(R, Acc, T, S, P);
  211. media_range_before_param(<< C, R/bits >>, Acc, T, S, P) when ?IS_TOKEN(C) -> ?LOWER(media_range_param, R, Acc, T, S, P, <<>>).
  212. media_range_param(<< $=, $", R/bits >>, Acc, T, S, P, K) -> media_range_quoted(R, Acc, T, S, P, K, <<>>);
  213. media_range_param(<< $=, C, R/bits >>, Acc, T, S, P, K) when ?IS_TOKEN(C) -> media_range_value(R, Acc, T, S, P, K, << C >>);
  214. media_range_param(<< C, R/bits >>, Acc, T, S, P, K) when ?IS_TOKEN(C) -> ?LOWER(media_range_param, R, Acc, T, S, P, K).
  215. media_range_quoted(<< $", R/bits >>, Acc, T, S, P, K, V) -> media_range_param_sep(R, Acc, T, S, [{K, V}|P]);
  216. media_range_quoted(<< $\\, C, R/bits >>, Acc, T, S, P, K, V) when ?IS_VCHAR_OBS(C) -> media_range_quoted(R, Acc, T, S, P, K, << V/binary, C >>);
  217. media_range_quoted(<< C, R/bits >>, Acc, T, S, P, K, V) when ?IS_VCHAR_OBS(C) -> media_range_quoted(R, Acc, T, S, P, K, << V/binary, C >>).
  218. media_range_value(<< C, R/bits >>, Acc, T, S, P, K, V) when ?IS_TOKEN(C) -> media_range_value(R, Acc, T, S, P, K, << V/binary, C >>);
  219. media_range_value(R, Acc, T, S, P, K, V) -> media_range_param_sep(R, Acc, T, S, [{K, V}|P]).
  220. media_range_weight(<< "1.000", R/bits >>, Acc, T, S, P) -> accept_ext_sep(R, Acc, T, S, P, 1000, []);
  221. media_range_weight(<< "1.00", R/bits >>, Acc, T, S, P) -> accept_ext_sep(R, Acc, T, S, P, 1000, []);
  222. media_range_weight(<< "1.0", R/bits >>, Acc, T, S, P) -> accept_ext_sep(R, Acc, T, S, P, 1000, []);
  223. media_range_weight(<< "1.", R/bits >>, Acc, T, S, P) -> accept_ext_sep(R, Acc, T, S, P, 1000, []);
  224. media_range_weight(<< "1", R/bits >>, Acc, T, S, P) -> accept_ext_sep(R, Acc, T, S, P, 1000, []);
  225. media_range_weight(<< "0.", A, B, C, R/bits >>, Acc, T, S, P) when ?IS_DIGIT(A), ?IS_DIGIT(B), ?IS_DIGIT(C) ->
  226. accept_ext_sep(R, Acc, T, S, P, (A - $0) * 100 + (B - $0) * 10 + (C - $0), []);
  227. media_range_weight(<< "0.", A, B, R/bits >>, Acc, T, S, P) when ?IS_DIGIT(A), ?IS_DIGIT(B) ->
  228. accept_ext_sep(R, Acc, T, S, P, (A - $0) * 100 + (B - $0) * 10, []);
  229. media_range_weight(<< "0.", A, R/bits >>, Acc, T, S, P) when ?IS_DIGIT(A) ->
  230. accept_ext_sep(R, Acc, T, S, P, (A - $0) * 100, []);
  231. media_range_weight(<< "0.", R/bits >>, Acc, T, S, P) -> accept_ext_sep(R, Acc, T, S, P, 0, []);
  232. media_range_weight(<< "0", R/bits >>, Acc, T, S, P) -> accept_ext_sep(R, Acc, T, S, P, 0, []);
  233. %% Special clauses for badly behaving user agents that send .123 instead of 0.123.
  234. media_range_weight(<< ".", A, B, C, R/bits >>, Acc, T, S, P) when ?IS_DIGIT(A), ?IS_DIGIT(B), ?IS_DIGIT(C) ->
  235. accept_ext_sep(R, Acc, T, S, P, (A - $0) * 100 + (B - $0) * 10 + (C - $0), []);
  236. media_range_weight(<< ".", A, B, R/bits >>, Acc, T, S, P) when ?IS_DIGIT(A), ?IS_DIGIT(B) ->
  237. accept_ext_sep(R, Acc, T, S, P, (A - $0) * 100 + (B - $0) * 10, []);
  238. media_range_weight(<< ".", A, R/bits >>, Acc, T, S, P) when ?IS_DIGIT(A) ->
  239. accept_ext_sep(R, Acc, T, S, P, (A - $0) * 100, []).
  240. accept_ext_sep(<<>>, Acc, T, S, P, Q, E) -> lists:reverse([{{T, S, lists:reverse(P)}, Q, lists:reverse(E)}|Acc]);
  241. accept_ext_sep(<< $,, R/bits >>, Acc, T, S, P, Q, E) -> media_range_list(R, [{{T, S, lists:reverse(P)}, Q, lists:reverse(E)}|Acc]);
  242. accept_ext_sep(<< $;, R/bits >>, Acc, T, S, P, Q, E) -> accept_before_ext(R, Acc, T, S, P, Q, E);
  243. accept_ext_sep(<< C, R/bits >>, Acc, T, S, P, Q, E) when ?IS_WS(C) -> accept_ext_sep(R, Acc, T, S, P, Q, E).
  244. accept_before_ext(<< C, R/bits >>, Acc, T, S, P, Q, E) when ?IS_WS(C) -> accept_before_ext(R, Acc, T, S, P, Q, E);
  245. accept_before_ext(<< C, R/bits >>, Acc, T, S, P, Q, E) when ?IS_TOKEN(C) -> ?LOWER(accept_ext, R, Acc, T, S, P, Q, E, <<>>).
  246. accept_ext(<< $=, $", R/bits >>, Acc, T, S, P, Q, E, K) -> accept_quoted(R, Acc, T, S, P, Q, E, K, <<>>);
  247. accept_ext(<< $=, C, R/bits >>, Acc, T, S, P, Q, E, K) when ?IS_TOKEN(C) -> accept_value(R, Acc, T, S, P, Q, E, K, << C >>);
  248. accept_ext(<< C, R/bits >>, Acc, T, S, P, Q, E, K) when ?IS_TOKEN(C) -> ?LOWER(accept_ext, R, Acc, T, S, P, Q, E, K);
  249. accept_ext(R, Acc, T, S, P, Q, E, K) -> accept_ext_sep(R, Acc, T, S, P, Q, [K|E]).
  250. accept_quoted(<< $", R/bits >>, Acc, T, S, P, Q, E, K, V) -> accept_ext_sep(R, Acc, T, S, P, Q, [{K, V}|E]);
  251. accept_quoted(<< $\\, C, R/bits >>, Acc, T, S, P, Q, E, K, V) when ?IS_VCHAR_OBS(C) -> accept_quoted(R, Acc, T, S, P, Q, E, K, << V/binary, C >>);
  252. accept_quoted(<< C, R/bits >>, Acc, T, S, P, Q, E, K, V) when ?IS_VCHAR_OBS(C) -> accept_quoted(R, Acc, T, S, P, Q, E, K, << V/binary, C >>).
  253. accept_value(<< C, R/bits >>, Acc, T, S, P, Q, E, K, V) when ?IS_TOKEN(C) -> accept_value(R, Acc, T, S, P, Q, E, K, << V/binary, C >>);
  254. accept_value(R, Acc, T, S, P, Q, E, K, V) -> accept_ext_sep(R, Acc, T, S, P, Q, [{K, V}|E]).
  255. -ifdef(TEST).
  256. accept_ext() ->
  257. oneof([token(), parameter()]).
  258. accept_params() ->
  259. frequency([
  260. {90, []},
  261. {10, small_list(accept_ext())}
  262. ]).
  263. accept() ->
  264. ?LET({T, S, P, W, E},
  265. {token(), token(), small_list(parameter()), weight(), accept_params()},
  266. {T, S, P, W, E, iolist_to_binary([T, $/, S,
  267. [[OWS1, $;, OWS2, K, $=, V] || {K, V, OWS1, OWS2} <- P],
  268. case W of
  269. undefined -> [];
  270. _ -> [
  271. [<<";q=">>, qvalue_to_iodata(W)],
  272. [case Ext of
  273. {K, V, OWS1, OWS2} -> [OWS1, $;, OWS2, K, $=, V];
  274. K -> [$;, K]
  275. end || Ext <- E]]
  276. end])}
  277. ).
  278. prop_parse_accept() ->
  279. ?FORALL(L,
  280. vector(1, 50, accept()),
  281. begin
  282. << _, Accept/binary >> = iolist_to_binary([[$,, A] || {_, _, _, _, _, A} <- L]),
  283. ResL = parse_accept(Accept),
  284. CheckedL = [begin
  285. ExpectedP = [{?LOWER(K), unquote(V)} || {K, V, _, _} <- P],
  286. ExpectedE = [case Ext of
  287. {K, V, _, _} -> {?LOWER(K), unquote(V)};
  288. K -> ?LOWER(K)
  289. end || Ext <- E],
  290. ResT =:= ?LOWER(T)
  291. andalso ResS =:= ?LOWER(S)
  292. andalso ResP =:= ExpectedP
  293. andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
  294. andalso ((W =:= undefined andalso ResE =:= []) orelse (W =/= undefined andalso ResE =:= ExpectedE))
  295. end || {{T, S, P, W, E, _}, {{ResT, ResS, ResP}, ResW, ResE}} <- lists:zip(L, ResL)],
  296. [true] =:= lists:usort(CheckedL)
  297. end
  298. ).
  299. parse_accept_test_() ->
  300. Tests = [
  301. {<<>>, []},
  302. {<<" ">>, []},
  303. {<<"audio/*; q=0.2, audio/basic">>, [
  304. {{<<"audio">>, <<"*">>, []}, 200, []},
  305. {{<<"audio">>, <<"basic">>, []}, 1000, []}
  306. ]},
  307. {<<"text/plain; q=0.5, text/html, "
  308. "text/x-dvi; q=0.8, text/x-c">>, [
  309. {{<<"text">>, <<"plain">>, []}, 500, []},
  310. {{<<"text">>, <<"html">>, []}, 1000, []},
  311. {{<<"text">>, <<"x-dvi">>, []}, 800, []},
  312. {{<<"text">>, <<"x-c">>, []}, 1000, []}
  313. ]},
  314. {<<"text/*, text/html, text/html;level=1, */*">>, [
  315. {{<<"text">>, <<"*">>, []}, 1000, []},
  316. {{<<"text">>, <<"html">>, []}, 1000, []},
  317. {{<<"text">>, <<"html">>, [{<<"level">>, <<"1">>}]}, 1000, []},
  318. {{<<"*">>, <<"*">>, []}, 1000, []}
  319. ]},
  320. {<<"text/*;q=0.3, text/html;q=0.7, text/html;level=1, "
  321. "text/html;level=2;q=0.4, */*;q=0.5">>, [
  322. {{<<"text">>, <<"*">>, []}, 300, []},
  323. {{<<"text">>, <<"html">>, []}, 700, []},
  324. {{<<"text">>, <<"html">>, [{<<"level">>, <<"1">>}]}, 1000, []},
  325. {{<<"text">>, <<"html">>, [{<<"level">>, <<"2">>}]}, 400, []},
  326. {{<<"*">>, <<"*">>, []}, 500, []}
  327. ]},
  328. {<<"text/html;level=1;quoted=\"hi hi hi\";"
  329. "q=0.123;standalone;complex=gits, text/plain">>, [
  330. {{<<"text">>, <<"html">>,
  331. [{<<"level">>, <<"1">>}, {<<"quoted">>, <<"hi hi hi">>}]}, 123,
  332. [<<"standalone">>, {<<"complex">>, <<"gits">>}]},
  333. {{<<"text">>, <<"plain">>, []}, 1000, []}
  334. ]},
  335. {<<"text/html, image/gif, image/jpeg, *; q=.2, */*; q=.2">>, [
  336. {{<<"text">>, <<"html">>, []}, 1000, []},
  337. {{<<"image">>, <<"gif">>, []}, 1000, []},
  338. {{<<"image">>, <<"jpeg">>, []}, 1000, []},
  339. {{<<"*">>, <<"*">>, []}, 200, []},
  340. {{<<"*">>, <<"*">>, []}, 200, []}
  341. ]}
  342. ],
  343. [{V, fun() -> R = parse_accept(V) end} || {V, R} <- Tests].
  344. parse_accept_error_test_() ->
  345. Tests = [
  346. <<"audio/basic, */;q=0.5">>,
  347. <<"audio/, audio/basic">>,
  348. <<"aud\tio/basic">>,
  349. <<"audio/basic;t=\"zero \\", 0, " woo\"">>
  350. ],
  351. [{V, fun() -> {'EXIT', _} = (catch parse_accept(V)) end} || V <- Tests].
  352. horse_parse_accept() ->
  353. horse:repeat(20000,
  354. parse_accept(<<"text/*;q=0.3, text/html;q=0.7, text/html;level=1, "
  355. "text/html;level=2;q=0.4, */*;q=0.5">>)
  356. ).
  357. -endif.
  358. %% @doc Parse the Accept-Charset header.
  359. -spec parse_accept_charset(binary()) -> [{binary(), qvalue()}].
  360. parse_accept_charset(Charset) ->
  361. nonempty(conneg_list(Charset, [])).
  362. conneg_list(<<>>, Acc) -> lists:reverse(Acc);
  363. conneg_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> conneg_list(R, Acc);
  364. conneg_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) -> ?LOWER(conneg, R, Acc, <<>>).
  365. conneg(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) -> ?LOWER(conneg, R, Acc, T);
  366. conneg(R, Acc, T) -> conneg_param_sep(R, Acc, T).
  367. conneg_param_sep(<<>>, Acc, T) -> lists:reverse([{T, 1000}|Acc]);
  368. conneg_param_sep(<< $,, R/bits >>, Acc, T) -> conneg_list(R, [{T, 1000}|Acc]);
  369. conneg_param_sep(<< $;, R/bits >>, Acc, T) -> conneg_before_weight(R, Acc, T);
  370. conneg_param_sep(<< C, R/bits >>, Acc, T) when ?IS_WS(C) -> conneg_param_sep(R, Acc, T).
  371. conneg_before_weight(<< C, R/bits >>, Acc, T) when ?IS_WS(C) -> conneg_before_weight(R, Acc, T);
  372. conneg_before_weight(<< $q, $=, R/bits >>, Acc, T) -> conneg_weight(R, Acc, T);
  373. %% Special clause for broken user agents that confuse ; and , separators.
  374. conneg_before_weight(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) -> ?LOWER(conneg, R, [{T, 1000}|Acc], <<>>).
  375. conneg_weight(<< "1.000", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
  376. conneg_weight(<< "1.00", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
  377. conneg_weight(<< "1.0", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
  378. conneg_weight(<< "1.", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
  379. conneg_weight(<< "1", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
  380. conneg_weight(<< "0.", A, B, C, R/bits >>, Acc, T) when ?IS_DIGIT(A), ?IS_DIGIT(B), ?IS_DIGIT(C) ->
  381. conneg_list_sep(R, [{T, (A - $0) * 100 + (B - $0) * 10 + (C - $0)}|Acc]);
  382. conneg_weight(<< "0.", A, B, R/bits >>, Acc, T) when ?IS_DIGIT(A), ?IS_DIGIT(B) ->
  383. conneg_list_sep(R, [{T, (A - $0) * 100 + (B - $0) * 10}|Acc]);
  384. conneg_weight(<< "0.", A, R/bits >>, Acc, T) when ?IS_DIGIT(A) ->
  385. conneg_list_sep(R, [{T, (A - $0) * 100}|Acc]);
  386. conneg_weight(<< "0.", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 0}|Acc]);
  387. conneg_weight(<< "0", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 0}|Acc]).
  388. conneg_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  389. conneg_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> conneg_list_sep(R, Acc);
  390. conneg_list_sep(<< $,, R/bits >>, Acc) -> conneg_list(R, Acc).
  391. -ifdef(TEST).
  392. accept_charset() ->
  393. ?LET({C, W},
  394. {token(), weight()},
  395. {C, W, iolist_to_binary([C, case W of
  396. undefined -> [];
  397. _ -> [<<";q=">>, qvalue_to_iodata(W)]
  398. end])}
  399. ).
  400. prop_parse_accept_charset() ->
  401. ?FORALL(L,
  402. non_empty(list(accept_charset())),
  403. begin
  404. << _, AcceptCharset/binary >> = iolist_to_binary([[$,, A] || {_, _, A} <- L]),
  405. ResL = parse_accept_charset(AcceptCharset),
  406. CheckedL = [begin
  407. ResC =:= ?LOWER(Ch)
  408. andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
  409. end || {{Ch, W, _}, {ResC, ResW}} <- lists:zip(L, ResL)],
  410. [true] =:= lists:usort(CheckedL)
  411. end).
  412. parse_accept_charset_test_() ->
  413. Tests = [
  414. {<<"iso-8859-5, unicode-1-1;q=0.8">>, [
  415. {<<"iso-8859-5">>, 1000},
  416. {<<"unicode-1-1">>, 800}
  417. ]},
  418. %% Some user agents send this invalid value for the Accept-Charset header
  419. {<<"ISO-8859-1;utf-8;q=0.7,*;q=0.7">>, [
  420. {<<"iso-8859-1">>, 1000},
  421. {<<"utf-8">>, 700},
  422. {<<"*">>, 700}
  423. ]}
  424. ],
  425. [{V, fun() -> R = parse_accept_charset(V) end} || {V, R} <- Tests].
  426. parse_accept_charset_error_test_() ->
  427. Tests = [
  428. <<>>
  429. ],
  430. [{V, fun() -> {'EXIT', _} = (catch parse_accept_charset(V)) end} || V <- Tests].
  431. horse_parse_accept_charset() ->
  432. horse:repeat(20000,
  433. parse_accept_charset(<<"iso-8859-5, unicode-1-1;q=0.8">>)
  434. ).
  435. -endif.
  436. %% @doc Parse the Accept-Encoding header.
  437. -spec parse_accept_encoding(binary()) -> [{binary(), qvalue()}].
  438. parse_accept_encoding(Encoding) ->
  439. conneg_list(Encoding, []).
  440. -ifdef(TEST).
  441. accept_encoding() ->
  442. ?LET({E, W},
  443. {token(), weight()},
  444. {E, W, iolist_to_binary([E, case W of
  445. undefined -> [];
  446. _ -> [<<";q=">>, qvalue_to_iodata(W)]
  447. end])}
  448. ).
  449. %% @todo This property seems useless, see prop_accept_charset.
  450. prop_parse_accept_encoding() ->
  451. ?FORALL(L,
  452. non_empty(list(accept_encoding())),
  453. begin
  454. << _, AcceptEncoding/binary >> = iolist_to_binary([[$,, A] || {_, _, A} <- L]),
  455. ResL = parse_accept_encoding(AcceptEncoding),
  456. CheckedL = [begin
  457. ResE =:= ?LOWER(E)
  458. andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
  459. end || {{E, W, _}, {ResE, ResW}} <- lists:zip(L, ResL)],
  460. [true] =:= lists:usort(CheckedL)
  461. end).
  462. parse_accept_encoding_test_() ->
  463. Tests = [
  464. {<<>>, []},
  465. {<<"*">>, [{<<"*">>, 1000}]},
  466. {<<"compress, gzip">>, [
  467. {<<"compress">>, 1000},
  468. {<<"gzip">>, 1000}
  469. ]},
  470. {<<"compress;q=0.5, gzip;q=1.0">>, [
  471. {<<"compress">>, 500},
  472. {<<"gzip">>, 1000}
  473. ]},
  474. {<<"gzip;q=1.0, identity; q=0.5, *;q=0">>, [
  475. {<<"gzip">>, 1000},
  476. {<<"identity">>, 500},
  477. {<<"*">>, 0}
  478. ]}
  479. ],
  480. [{V, fun() -> R = parse_accept_encoding(V) end} || {V, R} <- Tests].
  481. horse_parse_accept_encoding() ->
  482. horse:repeat(20000,
  483. parse_accept_encoding(<<"gzip;q=1.0, identity; q=0.5, *;q=0">>)
  484. ).
  485. -endif.
  486. %% @doc Parse the Accept-Language header.
  487. -spec parse_accept_language(binary()) -> [{binary(), qvalue()}].
  488. parse_accept_language(LanguageRange) ->
  489. nonempty(language_range_list(LanguageRange, [])).
  490. language_range_list(<<>>, Acc) -> lists:reverse(Acc);
  491. language_range_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> language_range_list(R, Acc);
  492. language_range_list(<< $*, R/bits >>, Acc) -> language_range_param_sep(R, Acc, <<"*">>);
  493. language_range_list(<< C, R/bits >>, Acc) when ?IS_ALPHA(C) ->
  494. ?LOWER(language_range, R, Acc, 1, <<>>).
  495. language_range(<< $-, C, R/bits >>, Acc, _, T) when ?IS_ALPHANUM(C) ->
  496. ?LOWER(language_range_sub, R, Acc, 1, << T/binary, $- >>);
  497. language_range(<< C, R/bits >>, Acc, N, T) when ?IS_ALPHA(C), N < 8 ->
  498. ?LOWER(language_range, R, Acc, N + 1, T);
  499. language_range(R, Acc, _, T) -> language_range_param_sep(R, Acc, T).
  500. language_range_sub(<< $-, R/bits >>, Acc, _, T) -> language_range_sub(R, Acc, 0, << T/binary, $- >>);
  501. language_range_sub(<< C, R/bits >>, Acc, N, T) when ?IS_ALPHANUM(C), N < 8 ->
  502. ?LOWER(language_range_sub, R, Acc, N + 1, T);
  503. language_range_sub(R, Acc, _, T) -> language_range_param_sep(R, Acc, T).
  504. language_range_param_sep(<<>>, Acc, T) -> lists:reverse([{T, 1000}|Acc]);
  505. language_range_param_sep(<< $,, R/bits >>, Acc, T) -> language_range_list(R, [{T, 1000}|Acc]);
  506. language_range_param_sep(<< $;, R/bits >>, Acc, T) -> language_range_before_weight(R, Acc, T);
  507. language_range_param_sep(<< C, R/bits >>, Acc, T) when ?IS_WS(C) -> language_range_param_sep(R, Acc, T).
  508. language_range_before_weight(<< C, R/bits >>, Acc, T) when ?IS_WS(C) -> language_range_before_weight(R, Acc, T);
  509. language_range_before_weight(<< $q, $=, R/bits >>, Acc, T) -> language_range_weight(R, Acc, T);
  510. %% Special clause for broken user agents that confuse ; and , separators.
  511. language_range_before_weight(<< C, R/bits >>, Acc, T) when ?IS_ALPHA(C) ->
  512. ?LOWER(language_range, R, [{T, 1000}|Acc], 1, <<>>).
  513. language_range_weight(<< "1.000", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
  514. language_range_weight(<< "1.00", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
  515. language_range_weight(<< "1.0", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
  516. language_range_weight(<< "1.", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
  517. language_range_weight(<< "1", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
  518. language_range_weight(<< "0.", A, B, C, R/bits >>, Acc, T) when ?IS_DIGIT(A), ?IS_DIGIT(B), ?IS_DIGIT(C) ->
  519. language_range_list_sep(R, [{T, (A - $0) * 100 + (B - $0) * 10 + (C - $0)}|Acc]);
  520. language_range_weight(<< "0.", A, B, R/bits >>, Acc, T) when ?IS_DIGIT(A), ?IS_DIGIT(B) ->
  521. language_range_list_sep(R, [{T, (A - $0) * 100 + (B - $0) * 10}|Acc]);
  522. language_range_weight(<< "0.", A, R/bits >>, Acc, T) when ?IS_DIGIT(A) ->
  523. language_range_list_sep(R, [{T, (A - $0) * 100}|Acc]);
  524. language_range_weight(<< "0.", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 0}|Acc]);
  525. language_range_weight(<< "0", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 0}|Acc]).
  526. language_range_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  527. language_range_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> language_range_list_sep(R, Acc);
  528. language_range_list_sep(<< $,, R/bits >>, Acc) -> language_range_list(R, Acc).
  529. -ifdef(TEST).
  530. language_range_tag() ->
  531. vector(1, 8, alpha()).
  532. language_range_subtag() ->
  533. [$-, vector(1, 8, alphanum())].
  534. language_range() ->
  535. [language_range_tag(), small_list(language_range_subtag())].
  536. accept_language() ->
  537. ?LET({R, W},
  538. {language_range(), weight()},
  539. {iolist_to_binary(R), W, iolist_to_binary([R, case W of
  540. undefined -> [];
  541. _ -> [<<";q=">>, qvalue_to_iodata(W)]
  542. end])}
  543. ).
  544. prop_parse_accept_language() ->
  545. ?FORALL(L,
  546. non_empty(list(accept_language())),
  547. begin
  548. << _, AcceptLanguage/binary >> = iolist_to_binary([[$,, A] || {_, _, A} <- L]),
  549. ResL = parse_accept_language(AcceptLanguage),
  550. CheckedL = [begin
  551. ResR =:= ?LOWER(R)
  552. andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
  553. end || {{R, W, _}, {ResR, ResW}} <- lists:zip(L, ResL)],
  554. [true] =:= lists:usort(CheckedL)
  555. end).
  556. parse_accept_language_test_() ->
  557. Tests = [
  558. {<<"da, en-gb;q=0.8, en;q=0.7">>, [
  559. {<<"da">>, 1000},
  560. {<<"en-gb">>, 800},
  561. {<<"en">>, 700}
  562. ]},
  563. {<<"en, en-US, en-cockney, i-cherokee, x-pig-latin, es-419">>, [
  564. {<<"en">>, 1000},
  565. {<<"en-us">>, 1000},
  566. {<<"en-cockney">>, 1000},
  567. {<<"i-cherokee">>, 1000},
  568. {<<"x-pig-latin">>, 1000},
  569. {<<"es-419">>, 1000}
  570. ]}
  571. ],
  572. [{V, fun() -> R = parse_accept_language(V) end} || {V, R} <- Tests].
  573. parse_accept_language_error_test_() ->
  574. Tests = [
  575. <<>>,
  576. <<"loooooong">>,
  577. <<"en-us-loooooong">>,
  578. <<"419-en-us">>
  579. ],
  580. [{V, fun() -> {'EXIT', _} = (catch parse_accept_language(V)) end} || V <- Tests].
  581. horse_parse_accept_language() ->
  582. horse:repeat(20000,
  583. parse_accept_language(<<"da, en-gb;q=0.8, en;q=0.7">>)
  584. ).
  585. -endif.
  586. %% @doc Parse the Accept-Ranges header.
  587. -spec parse_accept_ranges(binary()) -> [binary()].
  588. parse_accept_ranges(<<"none">>) -> [];
  589. parse_accept_ranges(<<"bytes">>) -> [<<"bytes">>];
  590. parse_accept_ranges(AcceptRanges) ->
  591. nonempty(token_ci_list(AcceptRanges, [])).
  592. -ifdef(TEST).
  593. parse_accept_ranges_test_() ->
  594. Tests = [
  595. {<<"bytes">>, [<<"bytes">>]},
  596. {<<"none">>, []},
  597. {<<"bytes, pages, kilos">>, [<<"bytes">>, <<"pages">>, <<"kilos">>]}
  598. ],
  599. [{V, fun() -> R = parse_accept_ranges(V) end} || {V, R} <- Tests].
  600. parse_accept_ranges_error_test_() ->
  601. Tests = [
  602. <<>>
  603. ],
  604. [{V, fun() -> {'EXIT', _} = (catch parse_accept_ranges(V)) end} || V <- Tests].
  605. horse_parse_accept_ranges_none() ->
  606. horse:repeat(200000,
  607. parse_accept_ranges(<<"none">>)
  608. ).
  609. horse_parse_accept_ranges_bytes() ->
  610. horse:repeat(200000,
  611. parse_accept_ranges(<<"bytes">>)
  612. ).
  613. horse_parse_accept_ranges_other() ->
  614. horse:repeat(200000,
  615. parse_accept_ranges(<<"bytes, pages, kilos">>)
  616. ).
  617. -endif.
  618. %% @doc Parse the Access-Control-Request-Headers header.
  619. -spec parse_access_control_request_headers(binary()) -> [binary()].
  620. parse_access_control_request_headers(Headers) ->
  621. token_ci_list(Headers, []).
  622. -ifdef(TEST).
  623. headers() ->
  624. ?LET(L,
  625. list({ows(), ows(), token()}),
  626. case L of
  627. [] -> {[], <<>>};
  628. _ ->
  629. << _, Headers/binary >> = iolist_to_binary([[OWS1, $,, OWS2, M] || {OWS1, OWS2, M} <- L]),
  630. {[?LOWER(M) || {_, _, M} <- L], Headers}
  631. end).
  632. prop_parse_access_control_request_headers() ->
  633. ?FORALL({L, Headers},
  634. headers(),
  635. L =:= parse_access_control_request_headers(Headers)).
  636. parse_access_control_request_headers_test_() ->
  637. Tests = [
  638. {<<>>, []},
  639. {<<"Content-Type">>, [<<"content-type">>]},
  640. {<<"accept, authorization, content-type">>, [<<"accept">>, <<"authorization">>, <<"content-type">>]},
  641. {<<"accept,, , authorization,content-type">>, [<<"accept">>, <<"authorization">>, <<"content-type">>]}
  642. ],
  643. [{V, fun() -> R = parse_access_control_request_headers(V) end} || {V, R} <- Tests].
  644. horse_parse_access_control_request_headers() ->
  645. horse:repeat(200000,
  646. parse_access_control_request_headers(<<"accept, authorization, content-type">>)
  647. ).
  648. -endif.
  649. %% @doc Parse the Access-Control-Request-Method header.
  650. -spec parse_access_control_request_method(binary()) -> binary().
  651. parse_access_control_request_method(Method) ->
  652. true = <<>> =/= Method,
  653. ok = validate_token(Method),
  654. Method.
  655. validate_token(<< C, R/bits >>) when ?IS_TOKEN(C) -> validate_token(R);
  656. validate_token(<<>>) -> ok.
  657. -ifdef(TEST).
  658. parse_access_control_request_method_test_() ->
  659. Tests = [
  660. <<"GET">>,
  661. <<"HEAD">>,
  662. <<"POST">>,
  663. <<"PUT">>,
  664. <<"DELETE">>,
  665. <<"TRACE">>,
  666. <<"CONNECT">>,
  667. <<"whatever">>
  668. ],
  669. [{V, fun() -> R = parse_access_control_request_method(V) end} || {V, R} <- Tests].
  670. parse_access_control_request_method_error_test_() ->
  671. Tests = [
  672. <<>>
  673. ],
  674. [{V, fun() -> {'EXIT', _} = (catch parse_access_control_request_method(V)) end} || V <- Tests].
  675. horse_parse_access_control_request_method() ->
  676. horse:repeat(200000,
  677. parse_access_control_request_method(<<"POST">>)
  678. ).
  679. -endif.
  680. %% @doc Parse the Age header.
  681. -spec parse_age(binary()) -> non_neg_integer().
  682. parse_age(Age) ->
  683. I = binary_to_integer(Age),
  684. true = I >= 0,
  685. I.
  686. -ifdef(TEST).
  687. parse_age_test_() ->
  688. Tests = [
  689. {<<"0">>, 0},
  690. {<<"42">>, 42},
  691. {<<"69">>, 69},
  692. {<<"1337">>, 1337},
  693. {<<"3495">>, 3495},
  694. {<<"1234567890">>, 1234567890}
  695. ],
  696. [{V, fun() -> R = parse_age(V) end} || {V, R} <- Tests].
  697. parse_age_error_test_() ->
  698. Tests = [
  699. <<>>,
  700. <<"123, 123">>,
  701. <<"4.17">>
  702. ],
  703. [{V, fun() -> {'EXIT', _} = (catch parse_age(V)) end} || V <- Tests].
  704. -endif.
  705. %% @doc Parse the Allow header.
  706. -spec parse_allow(binary()) -> [binary()].
  707. parse_allow(Allow) ->
  708. token_list(Allow, []).
  709. -ifdef(TEST).
  710. allow() ->
  711. ?LET(L,
  712. list({ows(), ows(), token()}),
  713. case L of
  714. [] -> {[], <<>>};
  715. _ ->
  716. << _, Allow/binary >> = iolist_to_binary([[OWS1, $,, OWS2, M] || {OWS1, OWS2, M} <- L]),
  717. {[M || {_, _, M} <- L], Allow}
  718. end).
  719. prop_parse_allow() ->
  720. ?FORALL({L, Allow},
  721. allow(),
  722. L =:= parse_allow(Allow)).
  723. parse_allow_test_() ->
  724. Tests = [
  725. {<<>>, []},
  726. {<<"GET, HEAD, PUT">>, [<<"GET">>, <<"HEAD">>, <<"PUT">>]}
  727. ],
  728. [{V, fun() -> R = parse_allow(V) end} || {V, R} <- Tests].
  729. horse_parse_allow() ->
  730. horse:repeat(200000,
  731. parse_allow(<<"GET, HEAD, PUT">>)
  732. ).
  733. -endif.
  734. %% @doc Parse the Authorization header.
  735. %%
  736. %% We support Basic, Digest and Bearer schemes only.
  737. %%
  738. %% In the Digest case we do not validate that the mandatory
  739. %% fields are present. When parsing auth-params, we do not
  740. %% accept BWS characters around the "=".
  741. -spec parse_authorization(binary())
  742. -> {basic, binary(), binary()}
  743. | {bearer, binary()}
  744. | {digest, [{binary(), binary()}]}.
  745. parse_authorization(<<"Basic ", R/bits >>) ->
  746. auth_basic(base64:decode(R), <<>>);
  747. parse_authorization(<<"Bearer ", R/bits >>) when R =/= <<>> ->
  748. validate_auth_bearer(R),
  749. {bearer, R};
  750. parse_authorization(<<"Digest ", R/bits >>) ->
  751. {digest, nonempty(auth_digest_list(R, []))}.
  752. auth_basic(<< $:, Password/bits >>, UserID) -> {basic, UserID, Password};
  753. auth_basic(<< C, R/bits >>, UserID) -> auth_basic(R, << UserID/binary, C >>).
  754. validate_auth_bearer(<< C, R/bits >>) when ?IS_TOKEN68(C) -> validate_auth_bearer(R);
  755. validate_auth_bearer(<< $=, R/bits >>) -> validate_auth_bearer_eq(R);
  756. validate_auth_bearer(<<>>) -> ok.
  757. validate_auth_bearer_eq(<< $=, R/bits >>) -> validate_auth_bearer_eq(R);
  758. validate_auth_bearer_eq(<<>>) -> ok.
  759. auth_digest_list(<<>>, Acc) -> lists:reverse(Acc);
  760. auth_digest_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> auth_digest_list(R, Acc);
  761. auth_digest_list(<< "algorithm=", C, R/bits >>, Acc) when ?IS_TOKEN(C) -> auth_digest_token(R, Acc, <<"algorithm">>, << C >>);
  762. auth_digest_list(<< "cnonce=\"", R/bits >>, Acc) -> auth_digest_quoted(R, Acc, <<"cnonce">>, <<>>);
  763. auth_digest_list(<< "nc=", A, B, C, D, E, F, G, H, R/bits >>, Acc)
  764. when ?IS_LHEX(A), ?IS_LHEX(B), ?IS_LHEX(C), ?IS_LHEX(D),
  765. ?IS_LHEX(E), ?IS_LHEX(F), ?IS_LHEX(G), ?IS_LHEX(H) ->
  766. auth_digest_list_sep(R, [{<<"nc">>, << A, B, C, D, E, F, G, H >>}|Acc]);
  767. auth_digest_list(<< "nonce=\"", R/bits >>, Acc) -> auth_digest_quoted(R, Acc, <<"nonce">>, <<>>);
  768. auth_digest_list(<< "opaque=\"", R/bits >>, Acc) -> auth_digest_quoted(R, Acc, <<"opaque">>, <<>>);
  769. auth_digest_list(<< "qop=", C, R/bits >>, Acc) when ?IS_TOKEN(C) -> auth_digest_token(R, Acc, <<"qop">>, << C >>);
  770. auth_digest_list(<< "realm=\"", R/bits >>, Acc) -> auth_digest_quoted(R, Acc, <<"realm">>, <<>>);
  771. auth_digest_list(<< "response=\"", R/bits >>, Acc) -> auth_digest_quoted(R, Acc, <<"response">>, <<>>);
  772. auth_digest_list(<< "uri=\"", R/bits >>, Acc) -> auth_digest_quoted(R, Acc, <<"uri">>, <<>>);
  773. auth_digest_list(<< "username=\"", R/bits >>, Acc) -> auth_digest_quoted(R, Acc, <<"username">>, <<>>);
  774. auth_digest_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) ->
  775. ?LOWER(auth_digest_param, R, Acc, <<>>).
  776. auth_digest_param(<< $=, $", R/bits >>, Acc, K) -> auth_digest_quoted(R, Acc, K, <<>>);
  777. auth_digest_param(<< $=, C, R/bits >>, Acc, K) when ?IS_TOKEN(C) -> auth_digest_token(R, Acc, K, << C >>);
  778. auth_digest_param(<< C, R/bits >>, Acc, K) when ?IS_TOKEN(C) ->
  779. ?LOWER(auth_digest_param, R, Acc, K).
  780. auth_digest_token(<< C, R/bits >>, Acc, K, V) when ?IS_TOKEN(C) -> auth_digest_token(R, Acc, K, << V/binary, C >>);
  781. auth_digest_token(R, Acc, K, V) -> auth_digest_list_sep(R, [{K, V}|Acc]).
  782. auth_digest_quoted(<< $", R/bits >>, Acc, K, V) -> auth_digest_list_sep(R, [{K, V}|Acc]);
  783. auth_digest_quoted(<< $\\, C, R/bits >>, Acc, K, V) when ?IS_VCHAR_OBS(C) -> auth_digest_quoted(R, Acc, K, << V/binary, C >>);
  784. auth_digest_quoted(<< C, R/bits >>, Acc, K, V) when ?IS_VCHAR_OBS(C) -> auth_digest_quoted(R, Acc, K, << V/binary, C >>).
  785. auth_digest_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  786. auth_digest_list_sep(<< $,, R/bits >>, Acc) -> auth_digest_list(R, Acc);
  787. auth_digest_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> auth_digest_list_sep(R, Acc).
  788. -ifdef(TEST).
  789. parse_authorization_test_() ->
  790. Tests = [
  791. {<<"Basic QWxhZGRpbjpvcGVuIHNlc2FtZQ==">>, {basic, <<"Aladdin">>, <<"open sesame">>}},
  792. {<<"Bearer mF_9.B5f-4.1JqM">>, {bearer, <<"mF_9.B5f-4.1JqM">>}},
  793. {<<"Digest username=\"Mufasa\","
  794. "realm=\"testrealm@host.com\","
  795. "nonce=\"dcd98b7102dd2f0e8b11d0f600bfb0c093\","
  796. "uri=\"/dir/index.html\","
  797. "qop=auth,"
  798. "nc=00000001,"
  799. "cnonce=\"0a4f113b\","
  800. "response=\"6629fae49393a05397450978507c4ef1\","
  801. "opaque=\"5ccc069c403ebaf9f0171e9517f40e41\"">>,
  802. {digest, [
  803. {<<"username">>, <<"Mufasa">>},
  804. {<<"realm">>, <<"testrealm@host.com">>},
  805. {<<"nonce">>, <<"dcd98b7102dd2f0e8b11d0f600bfb0c093">>},
  806. {<<"uri">>, <<"/dir/index.html">>},
  807. {<<"qop">>, <<"auth">>},
  808. {<<"nc">>, <<"00000001">>},
  809. {<<"cnonce">>, <<"0a4f113b">>},
  810. {<<"response">>, <<"6629fae49393a05397450978507c4ef1">>},
  811. {<<"opaque">>, <<"5ccc069c403ebaf9f0171e9517f40e41">>}]}}
  812. ],
  813. [{V, fun() -> R = parse_authorization(V) end} || {V, R} <- Tests].
  814. horse_parse_authorization_basic() ->
  815. horse:repeat(20000,
  816. parse_authorization(<<"Basic QWxhZGRpbjpvcGVuIHNlc2FtZQ==">>)
  817. ).
  818. horse_parse_authorization_bearer() ->
  819. horse:repeat(20000,
  820. parse_authorization(<<"Bearer mF_9.B5f-4.1JqM">>)
  821. ).
  822. horse_parse_authorization_digest() ->
  823. horse:repeat(20000,
  824. parse_authorization(
  825. <<"Digest username=\"Mufasa\","
  826. "realm=\"testrealm@host.com\","
  827. "nonce=\"dcd98b7102dd2f0e8b11d0f600bfb0c093\","
  828. "uri=\"/dir/index.html\","
  829. "qop=auth,"
  830. "nc=00000001,"
  831. "cnonce=\"0a4f113b\","
  832. "response=\"6629fae49393a05397450978507c4ef1\","
  833. "opaque=\"5ccc069c403ebaf9f0171e9517f40e41\"">>)
  834. ).
  835. -endif.
  836. %% @doc Parse the Cache-Control header.
  837. %%
  838. %% In the fields list case, we do not support escaping, which shouldn't be needed anyway.
  839. -spec parse_cache_control(binary())
  840. -> [binary() | {binary(), binary()} | {binary(), non_neg_integer()} | {binary(), [binary()]}].
  841. parse_cache_control(<<"no-cache">>) ->
  842. [<<"no-cache">>];
  843. parse_cache_control(<<"max-age=0">>) ->
  844. [{<<"max-age">>, 0}];
  845. parse_cache_control(CacheControl) ->
  846. nonempty(cache_directive_list(CacheControl, [])).
  847. cache_directive_list(<<>>, Acc) -> lists:reverse(Acc);
  848. cache_directive_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C)-> cache_directive_list(R, Acc);
  849. cache_directive_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) ->
  850. ?LOWER(cache_directive, R, Acc, <<>>).
  851. cache_directive(<< $=, $", R/bits >>, Acc, T)
  852. when (T =:= <<"no-cache">>) or (T =:= <<"private">>) ->
  853. cache_directive_fields_list(R, Acc, T, []);
  854. cache_directive(<< $=, C, R/bits >>, Acc, T)
  855. when ?IS_DIGIT(C), (T =:= <<"max-age">>) or (T =:= <<"max-stale">>)
  856. or (T =:= <<"min-fresh">>) or (T =:= <<"s-maxage">>) ->
  857. cache_directive_delta(R, Acc, T, (C - $0));
  858. cache_directive(<< $=, $", R/bits >>, Acc, T) -> cache_directive_quoted_string(R, Acc, T, <<>>);
  859. cache_directive(<< $=, C, R/bits >>, Acc, T) when ?IS_TOKEN(C) -> cache_directive_token(R, Acc, T, << C >>);
  860. cache_directive(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) ->
  861. ?LOWER(cache_directive, R, Acc, T);
  862. cache_directive(R, Acc, T) -> cache_directive_list_sep(R, [T|Acc]).
  863. cache_directive_delta(<< C, R/bits >>, Acc, K, V) when ?IS_DIGIT(C) -> cache_directive_delta(R, Acc, K, V * 10 + (C - $0));
  864. cache_directive_delta(R, Acc, K, V) -> cache_directive_list_sep(R, [{K, V}|Acc]).
  865. cache_directive_fields_list(<< C, R/bits >>, Acc, K, L) when ?IS_WS_COMMA(C) -> cache_directive_fields_list(R, Acc, K, L);
  866. cache_directive_fields_list(<< $", R/bits >>, Acc, K, L) -> cache_directive_list_sep(R, [{K, lists:reverse(L)}|Acc]);
  867. cache_directive_fields_list(<< C, R/bits >>, Acc, K, L) when ?IS_TOKEN(C) ->
  868. ?LOWER(cache_directive_field, R, Acc, K, L, <<>>).
  869. cache_directive_field(<< C, R/bits >>, Acc, K, L, F) when ?IS_TOKEN(C) ->
  870. ?LOWER(cache_directive_field, R, Acc, K, L, F);
  871. cache_directive_field(R, Acc, K, L, F) -> cache_directive_fields_list_sep(R, Acc, K, [F|L]).
  872. cache_directive_fields_list_sep(<< C, R/bits >>, Acc, K, L) when ?IS_WS(C) -> cache_directive_fields_list_sep(R, Acc, K, L);
  873. cache_directive_fields_list_sep(<< $,, R/bits >>, Acc, K, L) -> cache_directive_fields_list(R, Acc, K, L);
  874. cache_directive_fields_list_sep(<< $", R/bits >>, Acc, K, L) -> cache_directive_list_sep(R, [{K, lists:reverse(L)}|Acc]).
  875. cache_directive_token(<< C, R/bits >>, Acc, K, V) when ?IS_TOKEN(C) -> cache_directive_token(R, Acc, K, << V/binary, C >>);
  876. cache_directive_token(R, Acc, K, V) -> cache_directive_list_sep(R, [{K, V}|Acc]).
  877. cache_directive_quoted_string(<< $", R/bits >>, Acc, K, V) -> cache_directive_list_sep(R, [{K, V}|Acc]);
  878. cache_directive_quoted_string(<< $\\, C, R/bits >>, Acc, K, V) when ?IS_VCHAR_OBS(C) ->
  879. cache_directive_quoted_string(R, Acc, K, << V/binary, C >>);
  880. cache_directive_quoted_string(<< C, R/bits >>, Acc, K, V) when ?IS_VCHAR_OBS(C) ->
  881. cache_directive_quoted_string(R, Acc, K, << V/binary, C >>).
  882. cache_directive_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  883. cache_directive_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> cache_directive_list_sep(R, Acc);
  884. cache_directive_list_sep(<< $,, R/bits >>, Acc) -> cache_directive_list(R, Acc).
  885. -ifdef(TEST).
  886. cache_directive_unreserved_token() ->
  887. ?SUCHTHAT(T,
  888. token(),
  889. T =/= <<"max-age">> andalso T =/= <<"max-stale">> andalso T =/= <<"min-fresh">>
  890. andalso T =/= <<"s-maxage">> andalso T =/= <<"no-cache">> andalso T =/= <<"private">>).
  891. cache_directive() ->
  892. oneof([
  893. token(),
  894. {cache_directive_unreserved_token(), token()},
  895. {cache_directive_unreserved_token(), quoted_string()},
  896. {elements([<<"max-age">>, <<"max-stale">>, <<"min-fresh">>, <<"s-maxage">>]), non_neg_integer()},
  897. {fields, elements([<<"no-cache">>, <<"private">>]), small_list(token())}
  898. ]).
  899. cache_control() ->
  900. ?LET(L,
  901. non_empty(list(cache_directive())),
  902. begin
  903. << _, CacheControl/binary >> = iolist_to_binary([[$,,
  904. case C of
  905. {fields, K, V} -> [K, $=, $", [[F, $,] || F <- V], $"];
  906. {K, V} when is_integer(V) -> [K, $=, integer_to_binary(V)];
  907. {K, V} -> [K, $=, V];
  908. K -> K
  909. end] || C <- L]),
  910. {L, CacheControl}
  911. end).
  912. prop_parse_cache_control() ->
  913. ?FORALL({L, CacheControl},
  914. cache_control(),
  915. begin
  916. ResL = parse_cache_control(CacheControl),
  917. CheckedL = [begin
  918. ExpectedCc = case Cc of
  919. {fields, K, V} -> {?LOWER(K), [?LOWER(F) || F <- V]};
  920. {K, V} -> {?LOWER(K), unquote(V)};
  921. K -> ?LOWER(K)
  922. end,
  923. ExpectedCc =:= ResCc
  924. end || {Cc, ResCc} <- lists:zip(L, ResL)],
  925. [true] =:= lists:usort(CheckedL)
  926. end).
  927. parse_cache_control_test_() ->
  928. Tests = [
  929. {<<"no-cache">>, [<<"no-cache">>]},
  930. {<<"no-store">>, [<<"no-store">>]},
  931. {<<"max-age=0">>, [{<<"max-age">>, 0}]},
  932. {<<"max-age=30">>, [{<<"max-age">>, 30}]},
  933. {<<"private, community=\"UCI\"">>, [<<"private">>, {<<"community">>, <<"UCI">>}]},
  934. {<<"private=\"Content-Type, Content-Encoding, Content-Language\"">>,
  935. [{<<"private">>, [<<"content-type">>, <<"content-encoding">>, <<"content-language">>]}]}
  936. ],
  937. [{V, fun() -> R = parse_cache_control(V) end} || {V, R} <- Tests].
  938. parse_cache_control_error_test_() ->
  939. Tests = [
  940. <<>>
  941. ],
  942. [{V, fun() -> {'EXIT', _} = (catch parse_cache_control(V)) end} || V <- Tests].
  943. horse_parse_cache_control_no_cache() ->
  944. horse:repeat(200000,
  945. parse_cache_control(<<"no-cache">>)
  946. ).
  947. horse_parse_cache_control_max_age_0() ->
  948. horse:repeat(200000,
  949. parse_cache_control(<<"max-age=0">>)
  950. ).
  951. horse_parse_cache_control_max_age_30() ->
  952. horse:repeat(200000,
  953. parse_cache_control(<<"max-age=30">>)
  954. ).
  955. horse_parse_cache_control_custom() ->
  956. horse:repeat(200000,
  957. parse_cache_control(<<"private, community=\"UCI\"">>)
  958. ).
  959. horse_parse_cache_control_fields() ->
  960. horse:repeat(200000,
  961. parse_cache_control(<<"private=\"Content-Type, Content-Encoding, Content-Language\"">>)
  962. ).
  963. -endif.
  964. %% @doc Parse the Connection header.
  965. -spec parse_connection(binary()) -> [binary()].
  966. parse_connection(<<"close">>) ->
  967. [<<"close">>];
  968. parse_connection(<<"keep-alive">>) ->
  969. [<<"keep-alive">>];
  970. parse_connection(Connection) ->
  971. nonempty(token_ci_list(Connection, [])).
  972. -ifdef(TEST).
  973. prop_parse_connection() ->
  974. ?FORALL(L,
  975. non_empty(list(token())),
  976. begin
  977. << _, Connection/binary >> = iolist_to_binary([[$,, C] || C <- L]),
  978. ResL = parse_connection(Connection),
  979. CheckedL = [?LOWER(Co) =:= ResC || {Co, ResC} <- lists:zip(L, ResL)],
  980. [true] =:= lists:usort(CheckedL)
  981. end).
  982. parse_connection_test_() ->
  983. Tests = [
  984. {<<"close">>, [<<"close">>]},
  985. {<<"ClOsE">>, [<<"close">>]},
  986. {<<"Keep-Alive">>, [<<"keep-alive">>]},
  987. {<<"keep-alive, Upgrade">>, [<<"keep-alive">>, <<"upgrade">>]}
  988. ],
  989. [{V, fun() -> R = parse_connection(V) end} || {V, R} <- Tests].
  990. parse_connection_error_test_() ->
  991. Tests = [
  992. <<>>
  993. ],
  994. [{V, fun() -> {'EXIT', _} = (catch parse_connection(V)) end} || V <- Tests].
  995. horse_parse_connection_close() ->
  996. horse:repeat(200000,
  997. parse_connection(<<"close">>)
  998. ).
  999. horse_parse_connection_keepalive() ->
  1000. horse:repeat(200000,
  1001. parse_connection(<<"keep-alive">>)
  1002. ).
  1003. horse_parse_connection_keepalive_upgrade() ->
  1004. horse:repeat(200000,
  1005. parse_connection(<<"keep-alive, upgrade">>)
  1006. ).
  1007. -endif.
  1008. %% @doc Parse the Content-Encoding header.
  1009. -spec parse_content_encoding(binary()) -> [binary()].
  1010. parse_content_encoding(ContentEncoding) ->
  1011. nonempty(token_ci_list(ContentEncoding, [])).
  1012. -ifdef(TEST).
  1013. parse_content_encoding_test_() ->
  1014. Tests = [
  1015. {<<"gzip">>, [<<"gzip">>]}
  1016. ],
  1017. [{V, fun() -> R = parse_content_encoding(V) end} || {V, R} <- Tests].
  1018. parse_content_encoding_error_test_() ->
  1019. Tests = [
  1020. <<>>
  1021. ],
  1022. [{V, fun() -> {'EXIT', _} = (catch parse_content_encoding(V)) end} || V <- Tests].
  1023. horse_parse_content_encoding() ->
  1024. horse:repeat(200000,
  1025. parse_content_encoding(<<"gzip">>)
  1026. ).
  1027. -endif.
  1028. %% @doc Parse the Content-Language header.
  1029. %%
  1030. %% We do not support irregular deprecated tags that do not match the ABNF.
  1031. -spec parse_content_language(binary()) -> [binary()].
  1032. parse_content_language(ContentLanguage) ->
  1033. nonempty(langtag_list(ContentLanguage, [])).
  1034. langtag_list(<<>>, Acc) -> lists:reverse(Acc);
  1035. langtag_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> langtag_list(R, Acc);
  1036. langtag_list(<< A, B, C, R/bits >>, Acc) when ?IS_ALPHA(A), ?IS_ALPHA(B), ?IS_ALPHA(C) ->
  1037. langtag_extlang(R, Acc, << ?LC(A), ?LC(B), ?LC(C) >>, 0);
  1038. langtag_list(<< A, B, R/bits >>, Acc) when ?IS_ALPHA(A), ?IS_ALPHA(B) ->
  1039. langtag_extlang(R, Acc, << ?LC(A), ?LC(B) >>, 0);
  1040. langtag_list(<< X, R/bits >>, Acc) when X =:= $x; X =:= $X -> langtag_privateuse_sub(R, Acc, << $x >>, 0).
  1041. langtag_extlang(<< $-, A, B, C, D, E, F, G, H, R/bits >>, Acc, T, _)
  1042. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1043. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G), ?IS_ALPHANUM(H) ->
  1044. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G), ?LC(H) >>);
  1045. langtag_extlang(<< $-, A, B, C, D, E, F, G, R/bits >>, Acc, T, _)
  1046. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1047. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G) ->
  1048. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G) >>);
  1049. langtag_extlang(<< $-, A, B, C, D, E, F, R/bits >>, Acc, T, _)
  1050. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1051. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F) ->
  1052. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F) >>);
  1053. langtag_extlang(<< $-, A, B, C, D, E, R/bits >>, Acc, T, _)
  1054. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D), ?IS_ALPHANUM(E) ->
  1055. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E) >>);
  1056. langtag_extlang(<< $-, A, B, C, D, R/bits >>, Acc, T, _)
  1057. when ?IS_ALPHA(A), ?IS_ALPHA(B), ?IS_ALPHA(C), ?IS_ALPHA(D) ->
  1058. langtag_region(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D) >>);
  1059. langtag_extlang(<< $-, A, B, C, R/bits >>, Acc, T, N)
  1060. when ?IS_ALPHA(A), ?IS_ALPHA(B), ?IS_ALPHA(C) ->
  1061. case N of
  1062. 2 -> langtag_script(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C) >>);
  1063. _ -> langtag_extlang(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C) >>, N + 1)
  1064. end;
  1065. langtag_extlang(R, Acc, T, _) -> langtag_region(R, Acc, T).
  1066. langtag_script(<< $-, A, B, C, D, E, F, G, H, R/bits >>, Acc, T)
  1067. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1068. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G), ?IS_ALPHANUM(H) ->
  1069. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G), ?LC(H) >>);
  1070. langtag_script(<< $-, A, B, C, D, E, F, G, R/bits >>, Acc, T)
  1071. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1072. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G) ->
  1073. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G) >>);
  1074. langtag_script(<< $-, A, B, C, D, E, F, R/bits >>, Acc, T)
  1075. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1076. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F) ->
  1077. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F) >>);
  1078. langtag_script(<< $-, A, B, C, D, E, R/bits >>, Acc, T)
  1079. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D), ?IS_ALPHANUM(E) ->
  1080. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E) >>);
  1081. langtag_script(<< $-, A, B, C, D, R/bits >>, Acc, T)
  1082. when ?IS_ALPHA(A), ?IS_ALPHA(B), ?IS_ALPHA(C), ?IS_ALPHA(D) ->
  1083. langtag_region(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D) >>);
  1084. langtag_script(R, Acc, T) ->
  1085. langtag_region(R, Acc, T).
  1086. langtag_region(<< $-, A, B, C, D, E, F, G, H, R/bits >>, Acc, T)
  1087. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1088. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G), ?IS_ALPHANUM(H) ->
  1089. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G), ?LC(H) >>);
  1090. langtag_region(<< $-, A, B, C, D, E, F, G, R/bits >>, Acc, T)
  1091. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1092. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G) ->
  1093. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G) >>);
  1094. langtag_region(<< $-, A, B, C, D, E, F, R/bits >>, Acc, T)
  1095. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1096. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F) ->
  1097. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F) >>);
  1098. langtag_region(<< $-, A, B, C, D, E, R/bits >>, Acc, T)
  1099. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D), ?IS_ALPHANUM(E) ->
  1100. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E) >>);
  1101. langtag_region(<< $-, A, B, C, D, R/bits >>, Acc, T)
  1102. when ?IS_DIGIT(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D) ->
  1103. langtag_variant(R, Acc, << T/binary, $-, A, ?LC(B), ?LC(C), ?LC(D) >>);
  1104. langtag_region(<< $-, A, B, R/bits >>, Acc, T) when ?IS_ALPHA(A), ?IS_ALPHA(B) ->
  1105. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B) >>);
  1106. langtag_region(<< $-, A, B, C, R/bits >>, Acc, T) when ?IS_DIGIT(A), ?IS_DIGIT(B), ?IS_DIGIT(C) ->
  1107. langtag_variant(R, Acc, << T/binary, $-, A, B, C >>);
  1108. langtag_region(R, Acc, T) ->
  1109. langtag_variant(R, Acc, T).
  1110. langtag_variant(<< $-, A, B, C, D, E, F, G, H, R/bits >>, Acc, T)
  1111. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1112. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G), ?IS_ALPHANUM(H) ->
  1113. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G), ?LC(H) >>);
  1114. langtag_variant(<< $-, A, B, C, D, E, F, G, R/bits >>, Acc, T)
  1115. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1116. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G) ->
  1117. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G) >>);
  1118. langtag_variant(<< $-, A, B, C, D, E, F, R/bits >>, Acc, T)
  1119. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1120. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F) ->
  1121. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F) >>);
  1122. langtag_variant(<< $-, A, B, C, D, E, R/bits >>, Acc, T)
  1123. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D), ?IS_ALPHANUM(E) ->
  1124. langtag_variant(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E) >>);
  1125. langtag_variant(<< $-, A, B, C, D, R/bits >>, Acc, T)
  1126. when ?IS_DIGIT(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D) ->
  1127. langtag_variant(R, Acc, << T/binary, $-, A, ?LC(B), ?LC(C), ?LC(D) >>);
  1128. langtag_variant(R, Acc, T) ->
  1129. langtag_extension(R, Acc, T).
  1130. langtag_extension(<< $-, X, R/bits >>, Acc, T) when X =:= $x; X =:= $X -> langtag_privateuse_sub(R, Acc, << T/binary, $-, $x >>, 0);
  1131. langtag_extension(<< $-, S, R/bits >>, Acc, T) when ?IS_ALPHANUM(S) -> langtag_extension_sub(R, Acc, << T/binary, $-, ?LC(S) >>, 0);
  1132. langtag_extension(R, Acc, T) -> langtag_list_sep(R, [T|Acc]).
  1133. langtag_extension_sub(<< $-, A, B, C, D, E, F, G, H, R/bits >>, Acc, T, N)
  1134. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1135. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G), ?IS_ALPHANUM(H) ->
  1136. langtag_extension_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G), ?LC(H) >>, N + 1);
  1137. langtag_extension_sub(<< $-, A, B, C, D, E, F, G, R/bits >>, Acc, T, N)
  1138. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1139. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G) ->
  1140. langtag_extension_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G) >>, N + 1);
  1141. langtag_extension_sub(<< $-, A, B, C, D, E, F, R/bits >>, Acc, T, N)
  1142. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1143. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F) ->
  1144. langtag_extension_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F) >>, N + 1);
  1145. langtag_extension_sub(<< $-, A, B, C, D, E, R/bits >>, Acc, T, N)
  1146. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D), ?IS_ALPHANUM(E) ->
  1147. langtag_extension_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E) >>, N + 1);
  1148. langtag_extension_sub(<< $-, A, B, C, D, R/bits >>, Acc, T, N)
  1149. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D) ->
  1150. langtag_extension_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D) >>, N + 1);
  1151. langtag_extension_sub(<< $-, A, B, C, R/bits >>, Acc, T, N)
  1152. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C) ->
  1153. langtag_extension_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C) >>, N + 1);
  1154. langtag_extension_sub(<< $-, A, B, R/bits >>, Acc, T, N)
  1155. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B) ->
  1156. langtag_extension_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B) >>, N + 1);
  1157. langtag_extension_sub(R, Acc, T, N) when N > 0 ->
  1158. langtag_extension(R, Acc, T).
  1159. langtag_privateuse_sub(<< $-, A, B, C, D, E, F, G, H, R/bits >>, Acc, T, N)
  1160. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1161. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G), ?IS_ALPHANUM(H) ->
  1162. langtag_privateuse_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G), ?LC(H) >>, N + 1);
  1163. langtag_privateuse_sub(<< $-, A, B, C, D, E, F, G, R/bits >>, Acc, T, N)
  1164. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1165. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F), ?IS_ALPHANUM(G) ->
  1166. langtag_privateuse_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F), ?LC(G) >>, N + 1);
  1167. langtag_privateuse_sub(<< $-, A, B, C, D, E, F, R/bits >>, Acc, T, N)
  1168. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D),
  1169. ?IS_ALPHANUM(E), ?IS_ALPHANUM(F) ->
  1170. langtag_privateuse_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E), ?LC(F) >>, N + 1);
  1171. langtag_privateuse_sub(<< $-, A, B, C, D, E, R/bits >>, Acc, T, N)
  1172. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D), ?IS_ALPHANUM(E) ->
  1173. langtag_privateuse_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D), ?LC(E) >>, N + 1);
  1174. langtag_privateuse_sub(<< $-, A, B, C, D, R/bits >>, Acc, T, N)
  1175. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C), ?IS_ALPHANUM(D) ->
  1176. langtag_privateuse_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C), ?LC(D) >>, N + 1);
  1177. langtag_privateuse_sub(<< $-, A, B, C, R/bits >>, Acc, T, N)
  1178. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B), ?IS_ALPHANUM(C) ->
  1179. langtag_privateuse_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B), ?LC(C) >>, N + 1);
  1180. langtag_privateuse_sub(<< $-, A, B, R/bits >>, Acc, T, N)
  1181. when ?IS_ALPHANUM(A), ?IS_ALPHANUM(B) ->
  1182. langtag_privateuse_sub(R, Acc, << T/binary, $-, ?LC(A), ?LC(B) >>, N + 1);
  1183. langtag_privateuse_sub(<< $-, A, R/bits >>, Acc, T, N)
  1184. when ?IS_ALPHANUM(A) ->
  1185. langtag_privateuse_sub(R, Acc, << T/binary, $-, ?LC(A) >>, N + 1);
  1186. langtag_privateuse_sub(R, Acc, T, N) when N > 0 -> langtag_list_sep(R, [T|Acc]).
  1187. langtag_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  1188. langtag_list_sep(<< $,, R/bits >>, Acc) -> langtag_list(R, Acc);
  1189. langtag_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> langtag_list_sep(R, Acc).
  1190. -ifdef(TEST).
  1191. langtag_language() -> vector(2, 3, alpha()).
  1192. langtag_extlang() -> vector(0, 3, [$-, alpha(), alpha(), alpha()]).
  1193. langtag_script() -> oneof([[], [$-, alpha(), alpha(), alpha(), alpha()]]).
  1194. langtag_region() -> oneof([[], [$-, alpha(), alpha()], [$-, digit(), digit(), digit()]]).
  1195. langtag_variant() ->
  1196. small_list(frequency([
  1197. {4, [$-, vector(5, 8, alphanum())]},
  1198. {1, [$-, digit(), alphanum(), alphanum(), alphanum()]}
  1199. ])).
  1200. langtag_extension() ->
  1201. small_list([$-, ?SUCHTHAT(S, alphanum(), S =/= $x andalso S =/= $X),
  1202. small_non_empty_list([$-, vector(2, 8, alphanum())])
  1203. ]).
  1204. langtag_privateuse() -> oneof([[], [$-, langtag_privateuse_nodash()]]).
  1205. langtag_privateuse_nodash() -> [elements([$x, $X]), small_non_empty_list([$-, vector(1, 8, alphanum())])].
  1206. private_language_tag() -> ?LET(T, langtag_privateuse_nodash(), iolist_to_binary(T)).
  1207. language_tag() ->
  1208. ?LET(IoList,
  1209. [langtag_language(), langtag_extlang(), langtag_script(), langtag_region(),
  1210. langtag_variant(), langtag_extension(), langtag_privateuse()],
  1211. iolist_to_binary(IoList)).
  1212. content_language() ->
  1213. ?LET(L,
  1214. non_empty(list(frequency([
  1215. {90, language_tag()},
  1216. {10, private_language_tag()}
  1217. ]))),
  1218. begin
  1219. << _, ContentLanguage/binary >> = iolist_to_binary([[$,, T] || T <- L]),
  1220. {L, ContentLanguage}
  1221. end).
  1222. prop_parse_content_language() ->
  1223. ?FORALL({L, ContentLanguage},
  1224. content_language(),
  1225. begin
  1226. ResL = parse_content_language(ContentLanguage),
  1227. CheckedL = [?LOWER(T) =:= ResT || {T, ResT} <- lists:zip(L, ResL)],
  1228. [true] =:= lists:usort(CheckedL)
  1229. end).
  1230. parse_content_language_test_() ->
  1231. Tests = [
  1232. {<<"de">>, [<<"de">>]},
  1233. {<<"fr">>, [<<"fr">>]},
  1234. {<<"ja">>, [<<"ja">>]},
  1235. {<<"zh-Hant">>, [<<"zh-hant">>]},
  1236. {<<"zh-Hans">>, [<<"zh-hans">>]},
  1237. {<<"sr-Cyrl">>, [<<"sr-cyrl">>]},
  1238. {<<"sr-Latn">>, [<<"sr-latn">>]},
  1239. {<<"zh-cmn-Hans-CN">>, [<<"zh-cmn-hans-cn">>]},
  1240. {<<"cmn-Hans-CN">>, [<<"cmn-hans-cn">>]},
  1241. {<<"zh-yue-HK">>, [<<"zh-yue-hk">>]},
  1242. {<<"yue-HK">>, [<<"yue-hk">>]},
  1243. {<<"zh-Hans-CN">>, [<<"zh-hans-cn">>]},
  1244. {<<"sr-Latn-RS">>, [<<"sr-latn-rs">>]},
  1245. {<<"sl-rozaj">>, [<<"sl-rozaj">>]},
  1246. {<<"sl-rozaj-biske">>, [<<"sl-rozaj-biske">>]},
  1247. {<<"sl-nedis">>, [<<"sl-nedis">>]},
  1248. {<<"de-CH-1901">>, [<<"de-ch-1901">>]},
  1249. {<<"sl-IT-nedis">>, [<<"sl-it-nedis">>]},
  1250. {<<"hy-Latn-IT-arevela">>, [<<"hy-latn-it-arevela">>]},
  1251. {<<"de-DE">>, [<<"de-de">>]},
  1252. {<<"en-US">>, [<<"en-us">>]},
  1253. {<<"es-419">>, [<<"es-419">>]},
  1254. {<<"de-CH-x-phonebk">>, [<<"de-ch-x-phonebk">>]},
  1255. {<<"az-Arab-x-AZE-derbend">>, [<<"az-arab-x-aze-derbend">>]},
  1256. {<<"x-whatever">>, [<<"x-whatever">>]},
  1257. {<<"qaa-Qaaa-QM-x-southern">>, [<<"qaa-qaaa-qm-x-southern">>]},
  1258. {<<"de-Qaaa">>, [<<"de-qaaa">>]},
  1259. {<<"sr-Latn-QM">>, [<<"sr-latn-qm">>]},
  1260. {<<"sr-Qaaa-RS">>, [<<"sr-qaaa-rs">>]},
  1261. {<<"en-US-u-islamcal">>, [<<"en-us-u-islamcal">>]},
  1262. {<<"zh-CN-a-myext-x-private">>, [<<"zh-cn-a-myext-x-private">>]},
  1263. {<<"en-a-myext-b-another">>, [<<"en-a-myext-b-another">>]},
  1264. {<<"mn-Cyrl-MN">>, [<<"mn-cyrl-mn">>]},
  1265. {<<"MN-cYRL-mn">>, [<<"mn-cyrl-mn">>]},
  1266. {<<"mN-cYrL-Mn">>, [<<"mn-cyrl-mn">>]},
  1267. {<<"az-Arab-IR">>, [<<"az-arab-ir">>]},
  1268. {<<"zh-gan">>, [<<"zh-gan">>]},
  1269. {<<"zh-yue">>, [<<"zh-yue">>]},
  1270. {<<"zh-cmn">>, [<<"zh-cmn">>]},
  1271. {<<"de-AT">>, [<<"de-at">>]},
  1272. {<<"de-CH-1996">>, [<<"de-ch-1996">>]},
  1273. {<<"en-Latn-GB-boont-r-extended-sequence-x-private">>,
  1274. [<<"en-latn-gb-boont-r-extended-sequence-x-private">>]},
  1275. {<<"el-x-koine">>, [<<"el-x-koine">>]},
  1276. {<<"el-x-attic">>, [<<"el-x-attic">>]},
  1277. {<<"fr, en-US, es-419, az-Arab, x-pig-latin, man-Nkoo-GN">>,
  1278. [<<"fr">>, <<"en-us">>, <<"es-419">>, <<"az-arab">>, <<"x-pig-latin">>, <<"man-nkoo-gn">>]},
  1279. {<<"da">>, [<<"da">>]},
  1280. {<<"mi, en">>, [<<"mi">>, <<"en">>]}
  1281. ],
  1282. [{V, fun() -> R = parse_content_language(V) end} || {V, R} <- Tests].
  1283. parse_content_language_error_test_() ->
  1284. Tests = [
  1285. <<>>
  1286. ],
  1287. [{V, fun() -> {'EXIT', _} = (catch parse_content_language(V)) end} || V <- Tests].
  1288. horse_parse_content_language() ->
  1289. horse:repeat(100000,
  1290. parse_content_language(<<"fr, en-US, es-419, az-Arab, x-pig-latin, man-Nkoo-GN">>)
  1291. ).
  1292. -endif.
  1293. %% @doc Parse the Content-Length header.
  1294. -spec parse_content_length(binary()) -> non_neg_integer().
  1295. parse_content_length(ContentLength) ->
  1296. I = binary_to_integer(ContentLength),
  1297. true = I >= 0,
  1298. I.
  1299. -ifdef(TEST).
  1300. prop_parse_content_length() ->
  1301. ?FORALL(
  1302. X,
  1303. non_neg_integer(),
  1304. X =:= parse_content_length(integer_to_binary(X))
  1305. ).
  1306. parse_content_length_test_() ->
  1307. Tests = [
  1308. {<<"0">>, 0},
  1309. {<<"42">>, 42},
  1310. {<<"69">>, 69},
  1311. {<<"1337">>, 1337},
  1312. {<<"3495">>, 3495},
  1313. {<<"1234567890">>, 1234567890}
  1314. ],
  1315. [{V, fun() -> R = parse_content_length(V) end} || {V, R} <- Tests].
  1316. parse_content_length_error_test_() ->
  1317. Tests = [
  1318. <<>>,
  1319. <<"-1">>,
  1320. <<"123, 123">>,
  1321. <<"4.17">>
  1322. ],
  1323. [{V, fun() -> {'EXIT', _} = (catch parse_content_length(V)) end} || V <- Tests].
  1324. horse_parse_content_length_zero() ->
  1325. horse:repeat(100000,
  1326. parse_content_length(<<"0">>)
  1327. ).
  1328. horse_parse_content_length_giga() ->
  1329. horse:repeat(100000,
  1330. parse_content_length(<<"1234567890">>)
  1331. ).
  1332. -endif.
  1333. %% @doc Parse the Content-Range header.
  1334. -spec parse_content_range(binary())
  1335. -> {bytes, non_neg_integer(), non_neg_integer(), non_neg_integer() | '*'}
  1336. | {bytes, '*', non_neg_integer()} | {binary(), binary()}.
  1337. parse_content_range(<<"bytes */", C, R/bits >>) when ?IS_DIGIT(C) -> unsatisfied_range(R, C - $0);
  1338. parse_content_range(<<"bytes ", C, R/bits >>) when ?IS_DIGIT(C) -> byte_range_first(R, C - $0);
  1339. parse_content_range(<< C, R/bits >>) when ?IS_TOKEN(C) ->
  1340. ?LOWER(other_content_range_unit, R, <<>>).
  1341. byte_range_first(<< $-, C, R/bits >>, First) when ?IS_DIGIT(C) -> byte_range_last(R, First, C - $0);
  1342. byte_range_first(<< C, R/bits >>, First) when ?IS_DIGIT(C) -> byte_range_first(R, First * 10 + C - $0).
  1343. byte_range_last(<<"/*">>, First, Last) -> {bytes, First, Last, '*'};
  1344. byte_range_last(<< $/, C, R/bits >>, First, Last) when ?IS_DIGIT(C) -> byte_range_complete(R, First, Last, C - $0);
  1345. byte_range_last(<< C, R/bits >>, First, Last) when ?IS_DIGIT(C) -> byte_range_last(R, First, Last * 10 + C - $0).
  1346. byte_range_complete(<<>>, First, Last, Complete) -> {bytes, First, Last, Complete};
  1347. byte_range_complete(<< C, R/bits >>, First, Last, Complete) when ?IS_DIGIT(C) ->
  1348. byte_range_complete(R, First, Last, Complete * 10 + C - $0).
  1349. unsatisfied_range(<<>>, Complete) -> {bytes, '*', Complete};
  1350. unsatisfied_range(<< C, R/bits >>, Complete) when ?IS_DIGIT(C) -> unsatisfied_range(R, Complete * 10 + C - $0).
  1351. other_content_range_unit(<< $\s, R/bits >>, Unit) -> other_content_range_resp(R, Unit, <<>>);
  1352. other_content_range_unit(<< C, R/bits >>, Unit) when ?IS_TOKEN(C) ->
  1353. ?LOWER(other_content_range_unit, R, Unit).
  1354. other_content_range_resp(<<>>, Unit, Resp) -> {Unit, Resp};
  1355. other_content_range_resp(<< C, R/bits >>, Unit, Resp) when ?IS_CHAR(C) -> other_content_range_resp(R, Unit, << Resp/binary, C >>).
  1356. -ifdef(TEST).
  1357. content_range() ->
  1358. ?LET(ContentRange,
  1359. oneof([
  1360. ?SUCHTHAT({bytes, First, Last, Complete},
  1361. {bytes, non_neg_integer(), non_neg_integer(), non_neg_integer()},
  1362. First =< Last andalso Last < Complete),
  1363. ?SUCHTHAT({bytes, First, Last, '*'},
  1364. {bytes, non_neg_integer(), non_neg_integer(), '*'},
  1365. First =< Last),
  1366. {bytes, '*', non_neg_integer()},
  1367. {token(), ?LET(L, list(abnf_char()), list_to_binary(L))}
  1368. ]),
  1369. {case ContentRange of
  1370. {Unit, Resp} when is_binary(Unit) -> {?LOWER(Unit), Resp};
  1371. _ -> ContentRange
  1372. end, case ContentRange of
  1373. {bytes, First, Last, '*'} ->
  1374. << "bytes ", (integer_to_binary(First))/binary, "-",
  1375. (integer_to_binary(Last))/binary, "/*">>;
  1376. {bytes, First, Last, Complete} ->
  1377. << "bytes ", (integer_to_binary(First))/binary, "-",
  1378. (integer_to_binary(Last))/binary, "/", (integer_to_binary(Complete))/binary >>;
  1379. {bytes, '*', Complete} ->
  1380. << "bytes */", (integer_to_binary(Complete))/binary >>;
  1381. {Unit, Resp} ->
  1382. << Unit/binary, $\s, Resp/binary >>
  1383. end}).
  1384. prop_parse_content_range() ->
  1385. ?FORALL({Res, ContentRange},
  1386. content_range(),
  1387. Res =:= parse_content_range(ContentRange)).
  1388. parse_content_range_test_() ->
  1389. Tests = [
  1390. {<<"bytes 21010-47021/47022">>, {bytes, 21010, 47021, 47022}},
  1391. {<<"bytes 500-999/8000">>, {bytes, 500, 999, 8000}},
  1392. {<<"bytes 7000-7999/8000">>, {bytes, 7000, 7999, 8000}},
  1393. {<<"bytes 42-1233/1234">>, {bytes, 42, 1233, 1234}},
  1394. {<<"bytes 42-1233/*">>, {bytes, 42, 1233, '*'}},
  1395. {<<"bytes */1234">>, {bytes, '*', 1234}},
  1396. {<<"bytes 0-499/1234">>, {bytes, 0, 499, 1234}},
  1397. {<<"bytes 500-999/1234">>, {bytes, 500, 999, 1234}},
  1398. {<<"bytes 500-1233/1234">>, {bytes, 500, 1233, 1234}},
  1399. {<<"bytes 734-1233/1234">>, {bytes, 734, 1233, 1234}},
  1400. {<<"bytes */47022">>, {bytes, '*', 47022}},
  1401. {<<"exampleunit 1.2-4.3/25">>, {<<"exampleunit">>, <<"1.2-4.3/25">>}},
  1402. {<<"exampleunit 11.2-14.3/25">>, {<<"exampleunit">>, <<"11.2-14.3/25">>}}
  1403. ],
  1404. [{V, fun() -> R = parse_content_range(V) end} || {V, R} <- Tests].
  1405. parse_content_range_error_test_() ->
  1406. Tests = [
  1407. <<>>
  1408. ],
  1409. [{V, fun() -> {'EXIT', _} = (catch parse_content_range(V)) end} || V <- Tests].
  1410. horse_parse_content_range_bytes() ->
  1411. horse:repeat(200000,
  1412. parse_content_range(<<"bytes 21010-47021/47022">>)
  1413. ).
  1414. horse_parse_content_range_other() ->
  1415. horse:repeat(200000,
  1416. parse_content_range(<<"exampleunit 11.2-14.3/25">>)
  1417. ).
  1418. -endif.
  1419. %% @doc Parse the Content-Type header.
  1420. -spec parse_content_type(binary()) -> media_type().
  1421. parse_content_type(<< C, R/bits >>) when ?IS_TOKEN(C) ->
  1422. ?LOWER(media_type, R, <<>>).
  1423. media_type(<< $/, C, R/bits >>, T) when ?IS_TOKEN(C) ->
  1424. ?LOWER(media_subtype, R, T, <<>>);
  1425. media_type(<< C, R/bits >>, T) when ?IS_TOKEN(C) ->
  1426. ?LOWER(media_type, R, T).
  1427. media_subtype(<< C, R/bits >>, T, S) when ?IS_TOKEN(C) ->
  1428. ?LOWER(media_subtype, R, T, S);
  1429. media_subtype(R, T, S) -> media_param_sep(R, T, S, []).
  1430. media_param_sep(<<>>, T, S, P) -> {T, S, lists:reverse(P)};
  1431. media_param_sep(<< $;, R/bits >>, T, S, P) -> media_before_param(R, T, S, P);
  1432. media_param_sep(<< C, R/bits >>, T, S, P) when ?IS_WS(C) -> media_param_sep(R, T, S, P).
  1433. media_before_param(<< C, R/bits >>, T, S, P) when ?IS_WS(C)-> media_before_param(R, T, S, P);
  1434. media_before_param(<< "charset=", $", R/bits >>, T, S, P) -> media_charset_quoted(R, T, S, P, <<>>);
  1435. media_before_param(<< "charset=", R/bits >>, T, S, P) -> media_charset(R, T, S, P, <<>>);
  1436. media_before_param(<< C, R/bits >>, T, S, P) when ?IS_TOKEN(C) ->
  1437. ?LOWER(media_param, R, T, S, P, <<>>).
  1438. media_charset_quoted(<< $", R/bits >>, T, S, P, V) ->
  1439. media_param_sep(R, T, S, [{<<"charset">>, V}|P]);
  1440. media_charset_quoted(<< $\\, C, R/bits >>, T, S, P, V) when ?IS_VCHAR_OBS(C) ->
  1441. ?LOWER(media_charset_quoted, R, T, S, P, V);
  1442. media_charset_quoted(<< C, R/bits >>, T, S, P, V) when ?IS_VCHAR_OBS(C) ->
  1443. ?LOWER(media_charset_quoted, R, T, S, P, V).
  1444. media_charset(<< C, R/bits >>, T, S, P, V) when ?IS_TOKEN(C) ->
  1445. ?LOWER(media_charset, R, T, S, P, V);
  1446. media_charset(R, T, S, P, V) -> media_param_sep(R, T, S, [{<<"charset">>, V}|P]).
  1447. media_param(<< $=, $", R/bits >>, T, S, P, K) -> media_quoted(R, T, S, P, K, <<>>);
  1448. media_param(<< $=, C, R/bits >>, T, S, P, K) when ?IS_TOKEN(C) -> media_value(R, T, S, P, K, << C >>);
  1449. media_param(<< C, R/bits >>, T, S, P, K) when ?IS_TOKEN(C) ->
  1450. ?LOWER(media_param, R, T, S, P, K).
  1451. media_quoted(<< $", R/bits >>, T, S, P, K, V) -> media_param_sep(R, T, S, [{K, V}|P]);
  1452. media_quoted(<< $\\, C, R/bits >>, T, S, P, K, V) when ?IS_VCHAR_OBS(C) -> media_quoted(R, T, S, P, K, << V/binary, C >>);
  1453. media_quoted(<< C, R/bits >>, T, S, P, K, V) when ?IS_VCHAR_OBS(C) -> media_quoted(R, T, S, P, K, << V/binary, C >>).
  1454. media_value(<< C, R/bits >>, T, S, P, K, V) when ?IS_TOKEN(C) -> media_value(R, T, S, P, K, << V/binary, C >>);
  1455. media_value(R, T, S, P, K, V) -> media_param_sep(R, T, S, [{K, V}|P]).
  1456. -ifdef(TEST).
  1457. media_type_parameter() ->
  1458. frequency([
  1459. {90, parameter()},
  1460. {10, {<<"charset">>, oneof([token(), quoted_string()]), <<>>, <<>>}}
  1461. ]).
  1462. media_type() ->
  1463. ?LET({T, S, P},
  1464. {token(), token(), small_list(media_type_parameter())},
  1465. {T, S, P, iolist_to_binary([T, $/, S, [[OWS1, $;, OWS2, K, $=, V] || {K, V, OWS1, OWS2} <- P]])}
  1466. ).
  1467. prop_parse_content_type() ->
  1468. ?FORALL({T, S, P, MediaType},
  1469. media_type(),
  1470. begin
  1471. {ResT, ResS, ResP} = parse_content_type(MediaType),
  1472. ExpectedP = [case ?LOWER(K) of
  1473. <<"charset">> -> {<<"charset">>, ?LOWER(unquote(V))};
  1474. LowK -> {LowK, unquote(V)}
  1475. end || {K, V, _, _} <- P],
  1476. ResT =:= ?LOWER(T)
  1477. andalso ResS =:= ?LOWER(S)
  1478. andalso ResP =:= ExpectedP
  1479. end
  1480. ).
  1481. parse_content_type_test_() ->
  1482. Tests = [
  1483. {<<"text/html;charset=utf-8">>,
  1484. {<<"text">>, <<"html">>, [{<<"charset">>, <<"utf-8">>}]}},
  1485. {<<"text/html;charset=UTF-8">>,
  1486. {<<"text">>, <<"html">>, [{<<"charset">>, <<"utf-8">>}]}},
  1487. {<<"Text/HTML;Charset=\"utf-8\"">>,
  1488. {<<"text">>, <<"html">>, [{<<"charset">>, <<"utf-8">>}]}},
  1489. {<<"text/html; charset=\"utf-8\"">>,
  1490. {<<"text">>, <<"html">>, [{<<"charset">>, <<"utf-8">>}]}},
  1491. {<<"text/html; charset=ISO-8859-4">>,
  1492. {<<"text">>, <<"html">>, [{<<"charset">>, <<"iso-8859-4">>}]}},
  1493. {<<"text/plain; charset=iso-8859-4">>,
  1494. {<<"text">>, <<"plain">>, [{<<"charset">>, <<"iso-8859-4">>}]}},
  1495. {<<"multipart/form-data \t;Boundary=\"MultipartIsUgly\"">>,
  1496. {<<"multipart">>, <<"form-data">>, [
  1497. {<<"boundary">>, <<"MultipartIsUgly">>}
  1498. ]}},
  1499. {<<"foo/bar; one=FirstParam; two=SecondParam">>,
  1500. {<<"foo">>, <<"bar">>, [
  1501. {<<"one">>, <<"FirstParam">>},
  1502. {<<"two">>, <<"SecondParam">>}
  1503. ]}}
  1504. ],
  1505. [{V, fun() -> R = parse_content_type(V) end} || {V, R} <- Tests].
  1506. horse_parse_content_type() ->
  1507. horse:repeat(200000,
  1508. parse_content_type(<<"text/html;charset=utf-8">>)
  1509. ).
  1510. -endif.
  1511. %% @doc Parse the Date header.
  1512. -spec parse_date(binary()) -> calendar:datetime().
  1513. parse_date(Date) ->
  1514. cow_date:parse_date(Date).
  1515. -ifdef(TEST).
  1516. parse_date_test_() ->
  1517. Tests = [
  1518. {<<"Tue, 15 Nov 1994 08:12:31 GMT">>, {{1994, 11, 15}, {8, 12, 31}}}
  1519. ],
  1520. [{V, fun() -> R = parse_date(V) end} || {V, R} <- Tests].
  1521. -endif.
  1522. %% @doc Parse the ETag header.
  1523. -spec parse_etag(binary()) -> etag().
  1524. parse_etag(<< $W, $/, $", R/bits >>) ->
  1525. etag(R, weak, <<>>);
  1526. parse_etag(<< $", R/bits >>) ->
  1527. etag(R, strong, <<>>).
  1528. etag(<< $" >>, Strength, Tag) ->
  1529. {Strength, Tag};
  1530. etag(<< C, R/bits >>, Strength, Tag) when ?IS_ETAGC(C) ->
  1531. etag(R, Strength, << Tag/binary, C >>).
  1532. -ifdef(TEST).
  1533. etagc() ->
  1534. ?SUCHTHAT(C, int(16#21, 16#ff), C =/= 16#22 andalso C =/= 16#7f).
  1535. etag() ->
  1536. ?LET({Strength, Tag},
  1537. {elements([weak, strong]), list(etagc())},
  1538. begin
  1539. TagBin = list_to_binary(Tag),
  1540. {{Strength, TagBin},
  1541. case Strength of
  1542. weak -> << $W, $/, $", TagBin/binary, $" >>;
  1543. strong -> << $", TagBin/binary, $" >>
  1544. end}
  1545. end).
  1546. prop_parse_etag() ->
  1547. ?FORALL({Tag, TagBin},
  1548. etag(),
  1549. Tag =:= parse_etag(TagBin)).
  1550. parse_etag_test_() ->
  1551. Tests = [
  1552. {<<"\"xyzzy\"">>, {strong, <<"xyzzy">>}},
  1553. {<<"W/\"xyzzy\"">>, {weak, <<"xyzzy">>}},
  1554. {<<"\"\"">>, {strong, <<>>}}
  1555. ],
  1556. [{V, fun() -> R = parse_etag(V) end} || {V, R} <- Tests].
  1557. parse_etag_error_test_() ->
  1558. Tests = [
  1559. <<>>,
  1560. <<"\"">>,
  1561. <<"W">>,
  1562. <<"W/">>
  1563. ],
  1564. [{V, fun() -> {'EXIT', _} = (catch parse_etag(V)) end} || V <- Tests].
  1565. horse_parse_etag() ->
  1566. horse:repeat(200000,
  1567. parse_etag(<<"W/\"xyzzy\"">>)
  1568. ).
  1569. -endif.
  1570. %% @doc Parse the Expect header.
  1571. -spec parse_expect(binary()) -> continue.
  1572. parse_expect(<<"100-continue">>) ->
  1573. continue;
  1574. parse_expect(<<"100-", C, O, N, T, I, M, U, E >>)
  1575. when (C =:= $C) or (C =:= $c), (O =:= $O) or (O =:= $o),
  1576. (N =:= $N) or (N =:= $n), (T =:= $T) or (T =:= $t),
  1577. (I =:= $I) or (I =:= $i), (M =:= $N) or (M =:= $n),
  1578. (U =:= $U) or (U =:= $u), (E =:= $E) or (E =:= $e) ->
  1579. continue.
  1580. -ifdef(TEST).
  1581. expect() ->
  1582. ?LET(E,
  1583. [$1, $0, $0, $-,
  1584. elements([$c, $C]), elements([$o, $O]), elements([$n, $N]),
  1585. elements([$t, $T]), elements([$i, $I]), elements([$n, $N]),
  1586. elements([$u, $U]), elements([$e, $E])],
  1587. list_to_binary(E)).
  1588. prop_parse_expect() ->
  1589. ?FORALL(E, expect(), continue =:= parse_expect(E)).
  1590. parse_expect_test_() ->
  1591. Tests = [
  1592. <<"100-continue">>,
  1593. <<"100-CONTINUE">>,
  1594. <<"100-Continue">>,
  1595. <<"100-CoNtInUe">>
  1596. ],
  1597. [{V, fun() -> continue = parse_expect(V) end} || V <- Tests].
  1598. parse_expect_error_test_() ->
  1599. Tests = [
  1600. <<>>,
  1601. <<" ">>,
  1602. <<"200-OK">>,
  1603. <<"Cookies">>
  1604. ],
  1605. [{V, fun() -> {'EXIT', _} = (catch parse_expect(V)) end} || V <- Tests].
  1606. horse_parse_expect() ->
  1607. horse:repeat(200000,
  1608. parse_expect(<<"100-continue">>)
  1609. ).
  1610. -endif.
  1611. %% @doc Parse the Expires header.
  1612. %%
  1613. %% Recipients must interpret invalid date formats as a date
  1614. %% in the past. The value "0" is commonly used.
  1615. -spec parse_expires(binary()) -> calendar:datetime().
  1616. parse_expires(<<"0">>) ->
  1617. {{1, 1, 1}, {0, 0, 0}};
  1618. parse_expires(Expires) ->
  1619. try
  1620. cow_date:parse_date(Expires)
  1621. catch _:_ ->
  1622. {{1, 1, 1}, {0, 0, 0}}
  1623. end.
  1624. -ifdef(TEST).
  1625. parse_expires_test_() ->
  1626. Tests = [
  1627. {<<"0">>, {{1, 1, 1}, {0, 0, 0}}},
  1628. {<<"Thu, 01 Dec 1994 nope invalid">>, {{1, 1, 1}, {0, 0, 0}}},
  1629. {<<"Thu, 01 Dec 1994 16:00:00 GMT">>, {{1994, 12, 1}, {16, 0, 0}}}
  1630. ],
  1631. [{V, fun() -> R = parse_expires(V) end} || {V, R} <- Tests].
  1632. horse_parse_expires_0() ->
  1633. horse:repeat(200000,
  1634. parse_expires(<<"0">>)
  1635. ).
  1636. horse_parse_expires_invalid() ->
  1637. horse:repeat(200000,
  1638. parse_expires(<<"Thu, 01 Dec 1994 nope invalid">>)
  1639. ).
  1640. -endif.
  1641. %% @doc Parse the Host header.
  1642. %%
  1643. %% We only seek to have legal characters and separate the
  1644. %% host and port values. The number of segments in the host
  1645. %% or the size of each segment is not checked.
  1646. %%
  1647. %% There is no way to distinguish IPv4 addresses from regular
  1648. %% names until the last segment is reached therefore we do not
  1649. %% differentiate them.
  1650. %%
  1651. %% The following valid hosts are currently rejected: IPv6
  1652. %% addresses with a zone identifier; IPvFuture addresses;
  1653. %% and percent-encoded addresses.
  1654. -spec parse_host(binary()) -> {binary(), 0..65535 | undefined}.
  1655. parse_host(<< $[, R/bits >>) ->
  1656. ipv6_address(R, << $[ >>);
  1657. parse_host(Host) ->
  1658. reg_name(Host, <<>>).
  1659. ipv6_address(<< $] >>, IP) -> {<< IP/binary, $] >>, undefined};
  1660. ipv6_address(<< $], $:, Port/bits >>, IP) -> {<< IP/binary, $] >>, binary_to_integer(Port)};
  1661. ipv6_address(<< C, R/bits >>, IP) when ?IS_HEX(C) or (C =:= $:) or (C =:= $.) ->
  1662. ?LOWER(ipv6_address, R, IP).
  1663. reg_name(<<>>, Name) -> {Name, undefined};
  1664. reg_name(<< $:, Port/bits >>, Name) -> {Name, binary_to_integer(Port)};
  1665. reg_name(<< C, R/bits >>, Name) when ?IS_URI_UNRESERVED(C) or ?IS_URI_SUB_DELIMS(C) ->
  1666. ?LOWER(reg_name, R, Name).
  1667. -ifdef(TEST).
  1668. host_chars() -> "!$&'()*+,-.0123456789;=ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz~".
  1669. host() -> vector(1, 255, elements(host_chars())).
  1670. host_port() ->
  1671. ?LET({Host, Port},
  1672. {host(), oneof([undefined, int(1, 65535)])},
  1673. begin
  1674. HostBin = list_to_binary(Host),
  1675. {{?LOWER(HostBin), Port},
  1676. case Port of
  1677. undefined -> HostBin;
  1678. _ -> << HostBin/binary, $:, (integer_to_binary(Port))/binary >>
  1679. end}
  1680. end).
  1681. prop_parse_host() ->
  1682. ?FORALL({Res, Host}, host_port(), Res =:= parse_host(Host)).
  1683. parse_host_test_() ->
  1684. Tests = [
  1685. {<<>>, {<<>>, undefined}},
  1686. {<<"www.example.org:8080">>, {<<"www.example.org">>, 8080}},
  1687. {<<"www.example.org">>, {<<"www.example.org">>, undefined}},
  1688. {<<"192.0.2.1:8080">>, {<<"192.0.2.1">>, 8080}},
  1689. {<<"192.0.2.1">>, {<<"192.0.2.1">>, undefined}},
  1690. {<<"[2001:db8::1]:8080">>, {<<"[2001:db8::1]">>, 8080}},
  1691. {<<"[2001:db8::1]">>, {<<"[2001:db8::1]">>, undefined}},
  1692. {<<"[::ffff:192.0.2.1]:8080">>, {<<"[::ffff:192.0.2.1]">>, 8080}},
  1693. {<<"[::ffff:192.0.2.1]">>, {<<"[::ffff:192.0.2.1]">>, undefined}}
  1694. ],
  1695. [{V, fun() -> R = parse_host(V) end} || {V, R} <- Tests].
  1696. horse_parse_host_blue_example_org() ->
  1697. horse:repeat(200000,
  1698. parse_host(<<"blue.example.org:8080">>)
  1699. ).
  1700. horse_parse_host_ipv4() ->
  1701. horse:repeat(200000,
  1702. parse_host(<<"192.0.2.1:8080">>)
  1703. ).
  1704. horse_parse_host_ipv6() ->
  1705. horse:repeat(200000,
  1706. parse_host(<<"[2001:db8::1]:8080">>)
  1707. ).
  1708. horse_parse_host_ipv6_v4() ->
  1709. horse:repeat(200000,
  1710. parse_host(<<"[::ffff:192.0.2.1]:8080">>)
  1711. ).
  1712. -endif.
  1713. %% @doc Parse the HTTP2-Settings header.
  1714. -spec parse_http2_settings(binary()) -> map().
  1715. parse_http2_settings(HTTP2Settings) ->
  1716. cow_http2:parse_settings_payload(base64:decode(HTTP2Settings)).
  1717. %% @doc Parse the If-Match header.
  1718. -spec parse_if_match(binary()) -> '*' | [etag()].
  1719. parse_if_match(<<"*">>) ->
  1720. '*';
  1721. parse_if_match(IfMatch) ->
  1722. nonempty(etag_list(IfMatch, [])).
  1723. etag_list(<<>>, Acc) -> lists:reverse(Acc);
  1724. etag_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> etag_list(R, Acc);
  1725. etag_list(<< $W, $/, $", R/bits >>, Acc) -> etag(R, Acc, weak, <<>>);
  1726. etag_list(<< $", R/bits >>, Acc) -> etag(R, Acc, strong, <<>>).
  1727. etag(<< $", R/bits >>, Acc, Strength, Tag) -> etag_list_sep(R, [{Strength, Tag}|Acc]);
  1728. etag(<< C, R/bits >>, Acc, Strength, Tag) when ?IS_ETAGC(C) -> etag(R, Acc, Strength, << Tag/binary, C >>).
  1729. etag_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  1730. etag_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> etag_list_sep(R, Acc);
  1731. etag_list_sep(<< $,, R/bits >>, Acc) -> etag_list(R, Acc).
  1732. -ifdef(TEST).
  1733. prop_parse_if_match() ->
  1734. ?FORALL(L,
  1735. non_empty(list(etag())),
  1736. begin
  1737. << _, IfMatch/binary >> = iolist_to_binary([[$,, T] || {_, T} <- L]),
  1738. ResL = parse_if_match(IfMatch),
  1739. CheckedL = [T =:= ResT || {{T, _}, ResT} <- lists:zip(L, ResL)],
  1740. [true] =:= lists:usort(CheckedL)
  1741. end).
  1742. parse_if_match_test_() ->
  1743. Tests = [
  1744. {<<"\"xyzzy\"">>, [{strong, <<"xyzzy">>}]},
  1745. {<<"\"xyzzy\", \"r2d2xxxx\", \"c3piozzzz\"">>,
  1746. [{strong, <<"xyzzy">>}, {strong, <<"r2d2xxxx">>}, {strong, <<"c3piozzzz">>}]},
  1747. {<<"*">>, '*'}
  1748. ],
  1749. [{V, fun() -> R = parse_if_match(V) end} || {V, R} <- Tests].
  1750. parse_if_match_error_test_() ->
  1751. Tests = [
  1752. <<>>
  1753. ],
  1754. [{V, fun() -> {'EXIT', _} = (catch parse_if_match(V)) end} || V <- Tests].
  1755. horse_parse_if_match() ->
  1756. horse:repeat(200000,
  1757. parse_if_match(<<"\"xyzzy\", \"r2d2xxxx\", \"c3piozzzz\"">>)
  1758. ).
  1759. -endif.
  1760. %% @doc Parse the If-Modified-Since header.
  1761. -spec parse_if_modified_since(binary()) -> calendar:datetime().
  1762. parse_if_modified_since(IfModifiedSince) ->
  1763. cow_date:parse_date(IfModifiedSince).
  1764. -ifdef(TEST).
  1765. parse_if_modified_since_test_() ->
  1766. Tests = [
  1767. {<<"Sat, 29 Oct 1994 19:43:31 GMT">>, {{1994, 10, 29}, {19, 43, 31}}}
  1768. ],
  1769. [{V, fun() -> R = parse_if_modified_since(V) end} || {V, R} <- Tests].
  1770. -endif.
  1771. %% @doc Parse the If-None-Match header.
  1772. -spec parse_if_none_match(binary()) -> '*' | [etag()].
  1773. parse_if_none_match(<<"*">>) ->
  1774. '*';
  1775. parse_if_none_match(IfNoneMatch) ->
  1776. nonempty(etag_list(IfNoneMatch, [])).
  1777. -ifdef(TEST).
  1778. parse_if_none_match_test_() ->
  1779. Tests = [
  1780. {<<"\"xyzzy\"">>, [{strong, <<"xyzzy">>}]},
  1781. {<<"W/\"xyzzy\"">>, [{weak, <<"xyzzy">>}]},
  1782. {<<"\"xyzzy\", \"r2d2xxxx\", \"c3piozzzz\"">>,
  1783. [{strong, <<"xyzzy">>}, {strong, <<"r2d2xxxx">>}, {strong, <<"c3piozzzz">>}]},
  1784. {<<"W/\"xyzzy\", W/\"r2d2xxxx\", W/\"c3piozzzz\"">>,
  1785. [{weak, <<"xyzzy">>}, {weak, <<"r2d2xxxx">>}, {weak, <<"c3piozzzz">>}]},
  1786. {<<"*">>, '*'}
  1787. ],
  1788. [{V, fun() -> R = parse_if_none_match(V) end} || {V, R} <- Tests].
  1789. parse_if_none_match_error_test_() ->
  1790. Tests = [
  1791. <<>>
  1792. ],
  1793. [{V, fun() -> {'EXIT', _} = (catch parse_if_none_match(V)) end} || V <- Tests].
  1794. horse_parse_if_none_match() ->
  1795. horse:repeat(200000,
  1796. parse_if_none_match(<<"W/\"xyzzy\", W/\"r2d2xxxx\", W/\"c3piozzzz\"">>)
  1797. ).
  1798. -endif.
  1799. %% @doc Parse the If-Range header.
  1800. -spec parse_if_range(binary()) -> etag() | calendar:datetime().
  1801. parse_if_range(<< $W, $/, $", R/bits >>) ->
  1802. etag(R, weak, <<>>);
  1803. parse_if_range(<< $", R/bits >>) ->
  1804. etag(R, strong, <<>>);
  1805. parse_if_range(IfRange) ->
  1806. cow_date:parse_date(IfRange).
  1807. -ifdef(TEST).
  1808. parse_if_range_test_() ->
  1809. Tests = [
  1810. {<<"W/\"xyzzy\"">>, {weak, <<"xyzzy">>}},
  1811. {<<"\"xyzzy\"">>, {strong, <<"xyzzy">>}},
  1812. {<<"Sat, 29 Oct 1994 19:43:31 GMT">>, {{1994, 10, 29}, {19, 43, 31}}}
  1813. ],
  1814. [{V, fun() -> R = parse_if_range(V) end} || {V, R} <- Tests].
  1815. parse_if_range_error_test_() ->
  1816. Tests = [
  1817. <<>>
  1818. ],
  1819. [{V, fun() -> {'EXIT', _} = (catch parse_if_range(V)) end} || V <- Tests].
  1820. horse_parse_if_range_etag() ->
  1821. horse:repeat(200000,
  1822. parse_if_range(<<"\"xyzzy\"">>)
  1823. ).
  1824. horse_parse_if_range_date() ->
  1825. horse:repeat(200000,
  1826. parse_if_range(<<"Sat, 29 Oct 1994 19:43:31 GMT">>)
  1827. ).
  1828. -endif.
  1829. %% @doc Parse the If-Unmodified-Since header.
  1830. -spec parse_if_unmodified_since(binary()) -> calendar:datetime().
  1831. parse_if_unmodified_since(IfModifiedSince) ->
  1832. cow_date:parse_date(IfModifiedSince).
  1833. -ifdef(TEST).
  1834. parse_if_unmodified_since_test_() ->
  1835. Tests = [
  1836. {<<"Sat, 29 Oct 1994 19:43:31 GMT">>, {{1994, 10, 29}, {19, 43, 31}}}
  1837. ],
  1838. [{V, fun() -> R = parse_if_unmodified_since(V) end} || {V, R} <- Tests].
  1839. -endif.
  1840. %% @doc Parse the Last-Modified header.
  1841. -spec parse_last_modified(binary()) -> calendar:datetime().
  1842. parse_last_modified(LastModified) ->
  1843. cow_date:parse_date(LastModified).
  1844. -ifdef(TEST).
  1845. parse_last_modified_test_() ->
  1846. Tests = [
  1847. {<<"Tue, 15 Nov 1994 12:45:26 GMT">>, {{1994, 11, 15}, {12, 45, 26}}}
  1848. ],
  1849. [{V, fun() -> R = parse_last_modified(V) end} || {V, R} <- Tests].
  1850. -endif.
  1851. %% @doc Parse the Max-Forwards header.
  1852. -spec parse_max_forwards(binary()) -> non_neg_integer().
  1853. parse_max_forwards(MaxForwards) ->
  1854. I = binary_to_integer(MaxForwards),
  1855. true = I >= 0,
  1856. I.
  1857. -ifdef(TEST).
  1858. prop_parse_max_forwards() ->
  1859. ?FORALL(
  1860. X,
  1861. non_neg_integer(),
  1862. X =:= parse_max_forwards(integer_to_binary(X))
  1863. ).
  1864. parse_max_forwards_test_() ->
  1865. Tests = [
  1866. {<<"0">>, 0},
  1867. {<<"42">>, 42},
  1868. {<<"69">>, 69},
  1869. {<<"1337">>, 1337},
  1870. {<<"1234567890">>, 1234567890}
  1871. ],
  1872. [{V, fun() -> R = parse_max_forwards(V) end} || {V, R} <- Tests].
  1873. parse_max_forwards_error_test_() ->
  1874. Tests = [
  1875. <<>>,
  1876. <<"123, 123">>,
  1877. <<"4.17">>
  1878. ],
  1879. [{V, fun() -> {'EXIT', _} = (catch parse_max_forwards(V)) end} || V <- Tests].
  1880. -endif.
  1881. %% @doc Parse the Origin header.
  1882. %% According to the RFC6454 we should generate
  1883. %% a fresh globally unique identifier and return that value if:
  1884. %% - URI does not use a hierarchical element as a naming authority
  1885. %% or the URI is not an absolute URI
  1886. %% - the implementation doesn't support the protocol given by uri-scheme
  1887. %% Thus, erlang reference represents a GUID here.
  1888. %%
  1889. %% We only seek to have legal characters and separate the
  1890. %% host and port values. The number of segments in the host
  1891. %% or the size of each segment is not checked.
  1892. %%
  1893. %% There is no way to distinguish IPv4 addresses from regular
  1894. %% names until the last segment is reached therefore we do not
  1895. %% differentiate them.
  1896. %%
  1897. %% @todo The following valid hosts are currently rejected: IPv6
  1898. %% addresses with a zone identifier; IPvFuture addresses;
  1899. %% and percent-encoded addresses.
  1900. -spec parse_origin(binary()) -> [{binary(), binary(), 0..65535} | reference()].
  1901. parse_origin(Origins) ->
  1902. nonempty(origin_scheme(Origins, [])).
  1903. origin_scheme(<<>>, Acc) -> Acc;
  1904. origin_scheme(<< "http://", R/bits >>, Acc) -> origin_host(R, Acc, <<"http">>);
  1905. origin_scheme(<< "https://", R/bits >>, Acc) -> origin_host(R, Acc, <<"https">>);
  1906. origin_scheme(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) -> origin_scheme(next_origin(R), [make_ref()|Acc]).
  1907. origin_host(<< $[, R/bits >>, Acc, Scheme) -> origin_ipv6_address(R, Acc, Scheme, << $[ >>);
  1908. origin_host(Host, Acc, Scheme) -> origin_reg_name(Host, Acc, Scheme, <<>>).
  1909. origin_ipv6_address(<< $] >>, Acc, Scheme, IP) ->
  1910. lists:reverse([{Scheme, << IP/binary, $] >>, default_port(Scheme)}|Acc]);
  1911. origin_ipv6_address(<< $], $\s, R/bits >>, Acc, Scheme, IP) ->
  1912. origin_scheme(R, [{Scheme, << IP/binary, $] >>, default_port(Scheme)}|Acc]);
  1913. origin_ipv6_address(<< $], $:, Port/bits >>, Acc, Scheme, IP) ->
  1914. origin_port(Port, Acc, Scheme, << IP/binary, $] >>, <<>>);
  1915. origin_ipv6_address(<< C, R/bits >>, Acc, Scheme, IP) when ?IS_HEX(C) or (C =:= $:) or (C =:= $.) ->
  1916. ?LOWER(origin_ipv6_address, R, Acc, Scheme, IP).
  1917. origin_reg_name(<<>>, Acc, Scheme, Name) ->
  1918. lists:reverse([{Scheme, Name, default_port(Scheme)}|Acc]);
  1919. origin_reg_name(<< $\s, R/bits >>, Acc, Scheme, Name) ->
  1920. origin_scheme(R, [{Scheme, Name, default_port(Scheme)}|Acc]);
  1921. origin_reg_name(<< $:, Port/bits >>, Acc, Scheme, Name) ->
  1922. origin_port(Port, Acc, Scheme, Name, <<>>);
  1923. origin_reg_name(<< C, R/bits >>, Acc, Scheme, Name) when ?IS_URI_UNRESERVED(C) or ?IS_URI_SUB_DELIMS(C) ->
  1924. ?LOWER(origin_reg_name, R, Acc, Scheme, Name).
  1925. origin_port(<<>>, Acc, Scheme, Host, Port) ->
  1926. lists:reverse([{Scheme, Host, binary_to_integer(Port)}|Acc]);
  1927. origin_port(<< $\s, R/bits >>, Acc, Scheme, Host, Port) ->
  1928. origin_scheme(R, [{Scheme, Host, binary_to_integer(Port)}|Acc]);
  1929. origin_port(<< C, R/bits >>, Acc, Scheme, Host, Port) when ?IS_DIGIT(C) ->
  1930. origin_port(R, Acc, Scheme, Host, << Port/binary, C >>).
  1931. next_origin(<<>>) -> <<>>;
  1932. next_origin(<< $\s, C, R/bits >>) when ?IS_TOKEN(C) -> << C, R/bits >>;
  1933. next_origin(<< C, R/bits >>) when ?IS_TOKEN(C) or (C =:= $:) or (C =:= $/) -> next_origin(R).
  1934. default_port(<< "http" >>) -> 80;
  1935. default_port(<< "https" >>) -> 443.
  1936. -ifdef(TEST).
  1937. scheme() -> oneof([<<"http">>, <<"https">>]).
  1938. scheme_host_port() ->
  1939. ?LET({Scheme, Host, Port},
  1940. {scheme(), host(), int(1, 65535)},
  1941. begin
  1942. HostBin = list_to_binary(Host),
  1943. {[{Scheme, ?LOWER(HostBin), Port}],
  1944. case default_port(Scheme) of
  1945. Port -> << Scheme/binary, "://", HostBin/binary>>;
  1946. _ -> << Scheme/binary, "://", HostBin/binary, $:, (integer_to_binary(Port))/binary >>
  1947. end}
  1948. end).
  1949. prop_parse_origin() ->
  1950. ?FORALL({Res, Origin}, scheme_host_port(), Res =:= parse_origin(Origin)).
  1951. parse_origin_test_() ->
  1952. Tests = [
  1953. {<<"http://www.example.org:8080">>, [{<<"http">>, <<"www.example.org">>, 8080}]},
  1954. {<<"http://www.example.org">>, [{<<"http">>, <<"www.example.org">>, 80}]},
  1955. {<<"http://192.0.2.1:8080">>, [{<<"http">>, <<"192.0.2.1">>, 8080}]},
  1956. {<<"http://192.0.2.1">>, [{<<"http">>, <<"192.0.2.1">>, 80}]},
  1957. {<<"http://[2001:db8::1]:8080">>, [{<<"http">>, <<"[2001:db8::1]">>, 8080}]},
  1958. {<<"http://[2001:db8::1]">>, [{<<"http">>, <<"[2001:db8::1]">>, 80}]},
  1959. {<<"http://[::ffff:192.0.2.1]:8080">>, [{<<"http">>, <<"[::ffff:192.0.2.1]">>, 8080}]},
  1960. {<<"http://[::ffff:192.0.2.1]">>, [{<<"http">>, <<"[::ffff:192.0.2.1]">>, 80}]},
  1961. {<<"http://example.org https://blue.example.com:8080">>,
  1962. [{<<"http">>, <<"example.org">>, 80},
  1963. {<<"https">>, <<"blue.example.com">>, 8080}]}
  1964. ],
  1965. [{V, fun() -> R = parse_origin(V) end} || {V, R} <- Tests].
  1966. parse_origin_reference_test_() ->
  1967. Tests = [
  1968. <<"null">>,
  1969. <<"httpx://example.org:80">>,
  1970. <<"httpx://example.org:80 null">>,
  1971. <<"null null">>
  1972. ],
  1973. [{V, fun() -> [true = is_reference(Ref) || Ref <- parse_origin(V)] end} || V <- Tests].
  1974. parse_origin_error_test_() ->
  1975. Tests = [
  1976. <<>>,
  1977. <<"null", $\t, "null">>,
  1978. <<"null", $\s, $\s, "null">>
  1979. ],
  1980. [{V, fun() -> {'EXIT', _} = (catch parse_origin(V)) end} || V <- Tests].
  1981. horse_parse_origin_blue_example_org() ->
  1982. horse:repeat(200000,
  1983. parse_origin(<<"http://blue.example.org:8080">>)
  1984. ).
  1985. horse_parse_origin_ipv4() ->
  1986. horse:repeat(200000,
  1987. parse_origin(<<"http://192.0.2.1:8080">>)
  1988. ).
  1989. horse_parse_origin_ipv6() ->
  1990. horse:repeat(200000,
  1991. parse_origin(<<"http://[2001:db8::1]:8080">>)
  1992. ).
  1993. horse_parse_origin_ipv6_v4() ->
  1994. horse:repeat(200000,
  1995. parse_origin(<<"http://[::ffff:192.0.2.1]:8080">>)
  1996. ).
  1997. horse_parse_origin_null() ->
  1998. horse:repeat(200000,
  1999. parse_origin(<<"null">>)
  2000. ).
  2001. -endif.
  2002. %% @doc Parse the Pragma header.
  2003. %%
  2004. %% Legacy header kept for backward compatibility with HTTP/1.0 caches.
  2005. %% Only the "no-cache" directive was ever specified, and only for
  2006. %% request messages.
  2007. %%
  2008. %% We take a large shortcut in the parsing of this header, expecting
  2009. %% an exact match of "no-cache".
  2010. -spec parse_pragma(binary()) -> cache | no_cache.
  2011. parse_pragma(<<"no-cache">>) -> no_cache;
  2012. parse_pragma(_) -> cache.
  2013. %% @doc Parse the Proxy-Authenticate header.
  2014. %%
  2015. %% Alias of parse_www_authenticate/1 due to identical syntax.
  2016. -spec parse_proxy_authenticate(binary()) -> [{basic, binary()}
  2017. | {bearer | digest | binary(), [{binary(), binary()}]}].
  2018. parse_proxy_authenticate(ProxyAuthenticate) ->
  2019. parse_www_authenticate(ProxyAuthenticate).
  2020. %% @doc Parse the Proxy-Authorization header.
  2021. %%
  2022. %% Alias of parse_authorization/1 due to identical syntax.
  2023. -spec parse_proxy_authorization(binary())
  2024. -> {basic, binary(), binary()}
  2025. | {bearer, binary()}
  2026. | {digest, [{binary(), binary()}]}.
  2027. parse_proxy_authorization(ProxyAuthorization) ->
  2028. parse_authorization(ProxyAuthorization).
  2029. %% @doc Parse the Range header.
  2030. -spec parse_range(binary())
  2031. -> {bytes, [{non_neg_integer(), non_neg_integer() | infinity} | neg_integer()]}
  2032. | {binary(), binary()}.
  2033. parse_range(<<"bytes=", R/bits >>) ->
  2034. bytes_range_set(R, []);
  2035. parse_range(<< C, R/bits >>) when ?IS_TOKEN(C) ->
  2036. ?LOWER(other_range_unit, R, <<>>).
  2037. bytes_range_set(<<>>, Acc) -> {bytes, lists:reverse(Acc)};
  2038. bytes_range_set(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> bytes_range_set(R, Acc);
  2039. bytes_range_set(<< $-, C, R/bits >>, Acc) when ?IS_DIGIT(C) -> bytes_range_suffix_spec(R, Acc, C - $0);
  2040. bytes_range_set(<< C, R/bits >>, Acc) when ?IS_DIGIT(C) -> bytes_range_spec(R, Acc, C - $0).
  2041. bytes_range_spec(<< $-, C, R/bits >>, Acc, First) when ?IS_DIGIT(C) -> bytes_range_spec_last(R, Acc, First, C - $0);
  2042. bytes_range_spec(<< $-, R/bits >>, Acc, First) -> bytes_range_set_sep(R, [{First, infinity}|Acc]);
  2043. bytes_range_spec(<< C, R/bits >>, Acc, First) when ?IS_DIGIT(C) -> bytes_range_spec(R, Acc, First * 10 + C - $0).
  2044. bytes_range_spec_last(<< C, R/bits >>, Acc, First, Last) when ?IS_DIGIT(C) -> bytes_range_spec_last(R, Acc, First, Last * 10 + C - $0);
  2045. bytes_range_spec_last(R, Acc, First, Last) -> bytes_range_set_sep(R, [{First, Last}|Acc]).
  2046. bytes_range_suffix_spec(<< C, R/bits >>, Acc, Suffix) when ?IS_DIGIT(C) -> bytes_range_suffix_spec(R, Acc, Suffix * 10 + C - $0);
  2047. bytes_range_suffix_spec(R, Acc, Suffix) -> bytes_range_set_sep(R, [-Suffix|Acc]).
  2048. bytes_range_set_sep(<<>>, Acc) -> {bytes, lists:reverse(Acc)};
  2049. bytes_range_set_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> bytes_range_set_sep(R, Acc);
  2050. bytes_range_set_sep(<< $,, R/bits >>, Acc) -> bytes_range_set(R, Acc).
  2051. other_range_unit(<< $=, C, R/bits >>, U) when ?IS_VCHAR(C) ->
  2052. other_range_set(R, U, << C >>);
  2053. other_range_unit(<< C, R/bits >>, U) when ?IS_TOKEN(C) ->
  2054. ?LOWER(other_range_unit, R, U).
  2055. other_range_set(<<>>, U, S) ->
  2056. {U, S};
  2057. other_range_set(<< C, R/bits >>, U, S) when ?IS_VCHAR(C) ->
  2058. other_range_set(R, U, << S/binary, C >>).
  2059. -ifdef(TEST).
  2060. bytes_range() ->
  2061. ?LET(BytesSet,
  2062. non_empty(list(oneof([
  2063. ?SUCHTHAT({First, Last}, {pos_integer(), pos_integer()}, First =< Last),
  2064. {pos_integer(), infinity},
  2065. ?LET(I, pos_integer(), -I)
  2066. ]))),
  2067. {{bytes, BytesSet}, begin
  2068. << _, Set/bits >> = iolist_to_binary([
  2069. case Spec of
  2070. {First, infinity} -> [$,, integer_to_binary(First), $-];
  2071. {First, Last} -> [$,, integer_to_binary(First), $-, integer_to_binary(Last)];
  2072. Suffix -> [$,, integer_to_binary(Suffix)]
  2073. end || Spec <- BytesSet]),
  2074. <<"bytes=", Set/binary >>
  2075. end}).
  2076. other_range() ->
  2077. ?LET(Range = {Unit, Set},
  2078. {token(), ?LET(L, non_empty(list(vchar())), list_to_binary(L))},
  2079. {Range, << Unit/binary, $=, Set/binary >>}).
  2080. range() ->
  2081. oneof([
  2082. bytes_range(),
  2083. other_range()
  2084. ]).
  2085. prop_parse_range() ->
  2086. ?FORALL({Range, RangeBin},
  2087. range(),
  2088. begin
  2089. Range2 = case Range of
  2090. {bytes, _} -> Range;
  2091. {Unit, Set} -> {?LOWER(Unit), Set}
  2092. end,
  2093. Range2 =:= parse_range(RangeBin)
  2094. end).
  2095. parse_range_test_() ->
  2096. Tests = [
  2097. {<<"bytes=0-499">>, {bytes, [{0, 499}]}},
  2098. {<<"bytes=500-999">>, {bytes, [{500, 999}]}},
  2099. {<<"bytes=-500">>, {bytes, [-500]}},
  2100. {<<"bytes=9500-">>, {bytes, [{9500, infinity}]}},
  2101. {<<"bytes=0-0,-1">>, {bytes, [{0, 0}, -1]}},
  2102. {<<"bytes=500-600,601-999">>, {bytes, [{500, 600}, {601, 999}]}},
  2103. {<<"bytes=500-700,601-999">>, {bytes, [{500, 700}, {601, 999}]}},
  2104. {<<"books=I-III,V-IX">>, {<<"books">>, <<"I-III,V-IX">>}}
  2105. ],
  2106. [{V, fun() -> R = parse_range(V) end} || {V, R} <- Tests].
  2107. parse_range_error_test_() ->
  2108. Tests = [
  2109. <<>>
  2110. ],
  2111. [{V, fun() -> {'EXIT', _} = (catch parse_range(V)) end} || V <- Tests].
  2112. horse_parse_range_first_last() ->
  2113. horse:repeat(200000,
  2114. parse_range(<<"bytes=500-999">>)
  2115. ).
  2116. horse_parse_range_infinity() ->
  2117. horse:repeat(200000,
  2118. parse_range(<<"bytes=9500-">>)
  2119. ).
  2120. horse_parse_range_suffix() ->
  2121. horse:repeat(200000,
  2122. parse_range(<<"bytes=-500">>)
  2123. ).
  2124. horse_parse_range_two() ->
  2125. horse:repeat(200000,
  2126. parse_range(<<"bytes=500-700,601-999">>)
  2127. ).
  2128. horse_parse_range_other() ->
  2129. horse:repeat(200000,
  2130. parse_range(<<"books=I-III,V-IX">>)
  2131. ).
  2132. -endif.
  2133. %% @doc Parse the Retry-After header.
  2134. -spec parse_retry_after(binary()) -> non_neg_integer() | calendar:datetime().
  2135. parse_retry_after(RetryAfter = << D, _/bits >>) when ?IS_DIGIT(D) ->
  2136. I = binary_to_integer(RetryAfter),
  2137. true = I >= 0,
  2138. I;
  2139. parse_retry_after(RetryAfter) ->
  2140. cow_date:parse_date(RetryAfter).
  2141. -ifdef(TEST).
  2142. parse_retry_after_test_() ->
  2143. Tests = [
  2144. {<<"Fri, 31 Dec 1999 23:59:59 GMT">>, {{1999, 12, 31}, {23, 59, 59}}},
  2145. {<<"120">>, 120}
  2146. ],
  2147. [{V, fun() -> R = parse_retry_after(V) end} || {V, R} <- Tests].
  2148. parse_retry_after_error_test_() ->
  2149. Tests = [
  2150. <<>>
  2151. ],
  2152. [{V, fun() -> {'EXIT', _} = (catch parse_retry_after(V)) end} || V <- Tests].
  2153. horse_parse_retry_after_date() ->
  2154. horse:repeat(200000,
  2155. parse_retry_after(<<"Fri, 31 Dec 1999 23:59:59 GMT">>)
  2156. ).
  2157. horse_parse_retry_after_delay_seconds() ->
  2158. horse:repeat(200000,
  2159. parse_retry_after(<<"120">>)
  2160. ).
  2161. -endif.
  2162. %% @doc Dummy parsing function for the Sec-WebSocket-Accept header.
  2163. %%
  2164. %% The argument is returned without any processing. This value is
  2165. %% expected to be matched directly by the client so no parsing is
  2166. %% needed.
  2167. -spec parse_sec_websocket_accept(binary()) -> binary().
  2168. parse_sec_websocket_accept(SecWebSocketAccept) ->
  2169. SecWebSocketAccept.
  2170. %% @doc Parse the Sec-WebSocket-Extensions request header.
  2171. -spec parse_sec_websocket_extensions(binary()) -> [{binary(), [binary() | {binary(), binary()}]}].
  2172. parse_sec_websocket_extensions(SecWebSocketExtensions) ->
  2173. nonempty(ws_extension_list(SecWebSocketExtensions, [])).
  2174. ws_extension_list(<<>>, Acc) -> lists:reverse(Acc);
  2175. ws_extension_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> ws_extension_list(R, Acc);
  2176. ws_extension_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) -> ws_extension(R, Acc, << C >>).
  2177. ws_extension(<< C, R/bits >>, Acc, E) when ?IS_TOKEN(C) -> ws_extension(R, Acc, << E/binary, C >>);
  2178. ws_extension(R, Acc, E) -> ws_extension_param_sep(R, Acc, E, []).
  2179. ws_extension_param_sep(<<>>, Acc, E, P) -> lists:reverse([{E, lists:reverse(P)}|Acc]);
  2180. ws_extension_param_sep(<< $,, R/bits >>, Acc, E, P) -> ws_extension_list(R, [{E, lists:reverse(P)}|Acc]);
  2181. ws_extension_param_sep(<< $;, R/bits >>, Acc, E, P) -> ws_extension_before_param(R, Acc, E, P);
  2182. ws_extension_param_sep(<< C, R/bits >>, Acc, E, P) when ?IS_WS(C) -> ws_extension_param_sep(R, Acc, E, P).
  2183. ws_extension_before_param(<< C, R/bits >>, Acc, E, P) when ?IS_WS(C) -> ws_extension_before_param(R, Acc, E, P);
  2184. ws_extension_before_param(<< C, R/bits >>, Acc, E, P) when ?IS_TOKEN(C) -> ws_extension_param(R, Acc, E, P, << C >>).
  2185. ws_extension_param(<< $=, $", R/bits >>, Acc, E, P, K) -> ws_extension_quoted(R, Acc, E, P, K, <<>>);
  2186. ws_extension_param(<< $=, C, R/bits >>, Acc, E, P, K) when ?IS_TOKEN(C) -> ws_extension_value(R, Acc, E, P, K, << C >>);
  2187. ws_extension_param(<< C, R/bits >>, Acc, E, P, K) when ?IS_TOKEN(C) -> ws_extension_param(R, Acc, E, P, << K/binary, C >>);
  2188. ws_extension_param(R, Acc, E, P, K) -> ws_extension_param_sep(R, Acc, E, [K|P]).
  2189. ws_extension_quoted(<< $", R/bits >>, Acc, E, P, K, V) -> ws_extension_param_sep(R, Acc, E, [{K, V}|P]);
  2190. ws_extension_quoted(<< $\\, C, R/bits >>, Acc, E, P, K, V) when ?IS_TOKEN(C) -> ws_extension_quoted(R, Acc, E, P, K, << V/binary, C >>);
  2191. ws_extension_quoted(<< C, R/bits >>, Acc, E, P, K, V) when ?IS_TOKEN(C) -> ws_extension_quoted(R, Acc, E, P, K, << V/binary, C >>).
  2192. ws_extension_value(<< C, R/bits >>, Acc, E, P, K, V) when ?IS_TOKEN(C) -> ws_extension_value(R, Acc, E, P, K, << V/binary, C >>);
  2193. ws_extension_value(R, Acc, E, P, K, V) -> ws_extension_param_sep(R, Acc, E, [{K, V}|P]).
  2194. -ifdef(TEST).
  2195. quoted_token() ->
  2196. ?LET(T,
  2197. non_empty(list(frequency([
  2198. {99, tchar()},
  2199. {1, [$\\, tchar()]}
  2200. ]))),
  2201. [$", T, $"]).
  2202. ws_extension() ->
  2203. ?LET({E, PL},
  2204. {token(), small_list({ows(), ows(), oneof([token(), {token(), oneof([token(), quoted_token()])}])})},
  2205. {E, PL, iolist_to_binary([E,
  2206. [case P of
  2207. {OWS1, OWS2, {K, V}} -> [OWS1, $;, OWS2, K, $=, V];
  2208. {OWS1, OWS2, K} -> [OWS1, $;, OWS2, K]
  2209. end || P <- PL]
  2210. ])}).
  2211. prop_parse_sec_websocket_extensions() ->
  2212. ?FORALL(L,
  2213. vector(1, 50, ws_extension()),
  2214. begin
  2215. << _, SecWebsocketExtensions/binary >> = iolist_to_binary([[$,, E] || {_, _, E} <- L]),
  2216. ResL = parse_sec_websocket_extensions(SecWebsocketExtensions),
  2217. CheckedL = [begin
  2218. ExpectedPL = [case P of
  2219. {_, _, {K, V}} -> {K, unquote(V)};
  2220. {_, _, K} -> K
  2221. end || P <- PL],
  2222. E =:= ResE andalso ExpectedPL =:= ResPL
  2223. end || {{E, PL, _}, {ResE, ResPL}} <- lists:zip(L, ResL)],
  2224. [true] =:= lists:usort(CheckedL)
  2225. end).
  2226. parse_sec_websocket_extensions_test_() ->
  2227. Tests = [
  2228. {<<"foo">>, [{<<"foo">>, []}]},
  2229. {<<"bar; baz=2">>, [{<<"bar">>, [{<<"baz">>, <<"2">>}]}]},
  2230. {<<"foo, bar; baz=2">>, [{<<"foo">>, []}, {<<"bar">>, [{<<"baz">>, <<"2">>}]}]},
  2231. {<<"deflate-stream">>, [{<<"deflate-stream">>, []}]},
  2232. {<<"mux; max-channels=4; flow-control, deflate-stream">>,
  2233. [{<<"mux">>, [{<<"max-channels">>, <<"4">>}, <<"flow-control">>]}, {<<"deflate-stream">>, []}]},
  2234. {<<"private-extension">>, [{<<"private-extension">>, []}]}
  2235. ],
  2236. [{V, fun() -> R = parse_sec_websocket_extensions(V) end} || {V, R} <- Tests].
  2237. parse_sec_websocket_extensions_error_test_() ->
  2238. Tests = [
  2239. <<>>
  2240. ],
  2241. [{V, fun() -> {'EXIT', _} = (catch parse_sec_websocket_extensions(V)) end}
  2242. || V <- Tests].
  2243. horse_parse_sec_websocket_extensions() ->
  2244. horse:repeat(200000,
  2245. parse_sec_websocket_extensions(<<"mux; max-channels=4; flow-control, deflate-stream">>)
  2246. ).
  2247. -endif.
  2248. %% @doc Dummy parsing function for the Sec-WebSocket-Key header.
  2249. %%
  2250. %% The argument is returned without any processing. This value is
  2251. %% expected to be prepended to a static value, the result of which
  2252. %% hashed to form a new base64 value returned in Sec-WebSocket-Accept,
  2253. %% therefore no parsing is needed.
  2254. -spec parse_sec_websocket_key(binary()) -> binary().
  2255. parse_sec_websocket_key(SecWebSocketKey) ->
  2256. SecWebSocketKey.
  2257. %% @doc Parse the Sec-WebSocket-Protocol request header.
  2258. -spec parse_sec_websocket_protocol_req(binary()) -> [binary()].
  2259. parse_sec_websocket_protocol_req(SecWebSocketProtocol) ->
  2260. nonempty(token_ci_list(SecWebSocketProtocol, [])).
  2261. -ifdef(TEST).
  2262. parse_sec_websocket_protocol_req_test_() ->
  2263. Tests = [
  2264. {<<"chat, superchat">>, [<<"chat">>, <<"superchat">>]}
  2265. ],
  2266. [{V, fun() -> R = parse_sec_websocket_protocol_req(V) end} || {V, R} <- Tests].
  2267. parse_sec_websocket_protocol_req_error_test_() ->
  2268. Tests = [
  2269. <<>>
  2270. ],
  2271. [{V, fun() -> {'EXIT', _} = (catch parse_sec_websocket_protocol_req(V)) end}
  2272. || V <- Tests].
  2273. horse_parse_sec_websocket_protocol_req() ->
  2274. horse:repeat(200000,
  2275. parse_sec_websocket_protocol_req(<<"chat, superchat">>)
  2276. ).
  2277. -endif.
  2278. %% @doc Parse the Sec-Websocket-Protocol response header.
  2279. -spec parse_sec_websocket_protocol_resp(binary()) -> binary().
  2280. parse_sec_websocket_protocol_resp(<< C, R/bits >>) when ?IS_TOKEN(C) ->
  2281. ?LOWER(token_ci, R, <<>>).
  2282. token_ci(<<>>, T) -> T;
  2283. token_ci(<< C, R/bits >>, T) when ?IS_TOKEN(C) ->
  2284. ?LOWER(token_ci, R, T).
  2285. -ifdef(TEST).
  2286. prop_parse_sec_websocket_protocol_resp() ->
  2287. ?FORALL(T,
  2288. token(),
  2289. ?LOWER(T) =:= parse_sec_websocket_protocol_resp(T)).
  2290. parse_sec_websocket_protocol_resp_test_() ->
  2291. Tests = [
  2292. {<<"chat">>, <<"chat">>},
  2293. {<<"CHAT">>, <<"chat">>}
  2294. ],
  2295. [{V, fun() -> R = parse_sec_websocket_protocol_resp(V) end} || {V, R} <- Tests].
  2296. parse_sec_websocket_protocol_resp_error_test_() ->
  2297. Tests = [
  2298. <<>>
  2299. ],
  2300. [{V, fun() -> {'EXIT', _} = (catch parse_sec_websocket_protocol_resp(V)) end}
  2301. || V <- Tests].
  2302. horse_parse_sec_websocket_protocol_resp() ->
  2303. horse:repeat(200000,
  2304. parse_sec_websocket_protocol_resp(<<"chat">>)
  2305. ).
  2306. -endif.
  2307. %% @doc Parse the Sec-WebSocket-Version request header.
  2308. -spec parse_sec_websocket_version_req(binary()) -> websocket_version().
  2309. parse_sec_websocket_version_req(SecWebSocketVersion) when byte_size(SecWebSocketVersion) < 4 ->
  2310. Version = binary_to_integer(SecWebSocketVersion),
  2311. true = Version >= 0 andalso Version =< 255,
  2312. Version.
  2313. -ifdef(TEST).
  2314. prop_parse_sec_websocket_version_req() ->
  2315. ?FORALL(Version,
  2316. int(0, 255),
  2317. Version =:= parse_sec_websocket_version_req(integer_to_binary(Version))).
  2318. parse_sec_websocket_version_req_test_() ->
  2319. Tests = [
  2320. {<<"13">>, 13},
  2321. {<<"25">>, 25}
  2322. ],
  2323. [{V, fun() -> R = parse_sec_websocket_version_req(V) end} || {V, R} <- Tests].
  2324. parse_sec_websocket_version_req_error_test_() ->
  2325. Tests = [
  2326. <<>>,
  2327. <<" ">>,
  2328. <<"7, 8, 13">>,
  2329. <<"invalid">>
  2330. ],
  2331. [{V, fun() -> {'EXIT', _} = (catch parse_sec_websocket_version_req(V)) end}
  2332. || V <- Tests].
  2333. horse_parse_sec_websocket_version_req_13() ->
  2334. horse:repeat(200000,
  2335. parse_sec_websocket_version_req(<<"13">>)
  2336. ).
  2337. horse_parse_sec_websocket_version_req_255() ->
  2338. horse:repeat(200000,
  2339. parse_sec_websocket_version_req(<<"255">>)
  2340. ).
  2341. -endif.
  2342. %% @doc Parse the Sec-WebSocket-Version response header.
  2343. -spec parse_sec_websocket_version_resp(binary()) -> [websocket_version()].
  2344. parse_sec_websocket_version_resp(SecWebSocketVersion) ->
  2345. nonempty(ws_version_list(SecWebSocketVersion, [])).
  2346. ws_version_list(<<>>, Acc) -> lists:reverse(Acc);
  2347. ws_version_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> ws_version_list(R, Acc);
  2348. ws_version_list(<< C, R/bits >>, Acc) when ?IS_DIGIT(C) -> ws_version(R, Acc, C - $0).
  2349. ws_version(<< C, R/bits >>, Acc, V) when ?IS_DIGIT(C) -> ws_version(R, Acc, V * 10 + C - $0);
  2350. ws_version(R, Acc, V) -> ws_version_list_sep(R, [V|Acc]).
  2351. ws_version_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  2352. ws_version_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> ws_version_list_sep(R, Acc);
  2353. ws_version_list_sep(<< $,, R/bits >>, Acc) -> ws_version_list(R, Acc).
  2354. -ifdef(TEST).
  2355. sec_websocket_version_resp() ->
  2356. ?LET(L,
  2357. non_empty(list({ows(), ows(), int(0, 255)})),
  2358. begin
  2359. << _, SecWebSocketVersion/binary >> = iolist_to_binary(
  2360. [[OWS1, $,, OWS2, integer_to_binary(V)] || {OWS1, OWS2, V} <- L]),
  2361. {[V || {_, _, V} <- L], SecWebSocketVersion}
  2362. end).
  2363. prop_parse_sec_websocket_version_resp() ->
  2364. ?FORALL({L, SecWebSocketVersion},
  2365. sec_websocket_version_resp(),
  2366. L =:= parse_sec_websocket_version_resp(SecWebSocketVersion)).
  2367. parse_sec_websocket_version_resp_test_() ->
  2368. Tests = [
  2369. {<<"13, 8, 7">>, [13, 8, 7]}
  2370. ],
  2371. [{V, fun() -> R = parse_sec_websocket_version_resp(V) end} || {V, R} <- Tests].
  2372. parse_sec_websocket_version_resp_error_test_() ->
  2373. Tests = [
  2374. <<>>
  2375. ],
  2376. [{V, fun() -> {'EXIT', _} = (catch parse_sec_websocket_version_resp(V)) end}
  2377. || V <- Tests].
  2378. horse_parse_sec_websocket_version_resp() ->
  2379. horse:repeat(200000,
  2380. parse_sec_websocket_version_resp(<<"13, 8, 7">>)
  2381. ).
  2382. -endif.
  2383. %% @doc Parse the TE header.
  2384. %%
  2385. %% This function does not support parsing of transfer-parameter.
  2386. -spec parse_te(binary()) -> {trailers | no_trailers, [{binary(), qvalue()}]}.
  2387. parse_te(TE) ->
  2388. te_list(TE, no_trailers, []).
  2389. te_list(<<>>, Trail, Acc) -> {Trail, lists:reverse(Acc)};
  2390. te_list(<< C, R/bits >>, Trail, Acc) when ?IS_WS_COMMA(C) -> te_list(R, Trail, Acc);
  2391. te_list(<< "trailers", R/bits >>, Trail, Acc) -> te(R, Trail, Acc, <<"trailers">>);
  2392. te_list(<< "compress", R/bits >>, Trail, Acc) -> te(R, Trail, Acc, <<"compress">>);
  2393. te_list(<< "deflate", R/bits >>, Trail, Acc) -> te(R, Trail, Acc, <<"deflate">>);
  2394. te_list(<< "gzip", R/bits >>, Trail, Acc) -> te(R, Trail, Acc, <<"gzip">>);
  2395. te_list(<< C, R/bits >>, Trail, Acc) when ?IS_TOKEN(C) ->
  2396. ?LOWER(te, R, Trail, Acc, <<>>).
  2397. te(<<>>, _, Acc, <<"trailers">>) -> {trailers, lists:reverse(Acc)};
  2398. te(<< $,, R/bits >>, _, Acc, <<"trailers">>) -> te_list(R, trailers, Acc);
  2399. te(<< $;, R/bits >>, Trail, Acc, T) when T =/= <<"trailers">> -> te_before_weight(R, Trail, Acc, T);
  2400. te(<< C, R/bits >>, _, Acc, <<"trailers">>) when ?IS_WS(C) -> te_list_sep(R, trailers, Acc);
  2401. te(<< C, R/bits >>, Trail, Acc, T) when ?IS_TOKEN(C) ->
  2402. ?LOWER(te, R, Trail, Acc, T);
  2403. te(R, Trail, Acc, T) -> te_param_sep(R, Trail, Acc, T).
  2404. te_param_sep(<<>>, Trail, Acc, T) -> {Trail, lists:reverse([{T, 1000}|Acc])};
  2405. te_param_sep(<< $,, R/bits >>, Trail, Acc, T) -> te_list(R, Trail, [{T, 1000}|Acc]);
  2406. te_param_sep(<< C, R/bits >>, Trail, Acc, T) when ?IS_WS(C) -> te_param_sep(R, Trail, Acc, T).
  2407. te_before_weight(<< C, R/bits >>, Trail, Acc, T) when ?IS_WS(C) -> te_before_weight(R, Trail, Acc, T);
  2408. te_before_weight(<< $q, $=, R/bits >>, Trail, Acc, T) -> te_weight(R, Trail, Acc, T).
  2409. te_weight(<< "1.000", R/bits >>, Trail, Acc, T) -> te_list_sep(R, Trail, [{T, 1000}|Acc]);
  2410. te_weight(<< "1.00", R/bits >>, Trail, Acc, T) -> te_list_sep(R, Trail, [{T, 1000}|Acc]);
  2411. te_weight(<< "1.0", R/bits >>, Trail, Acc, T) -> te_list_sep(R, Trail, [{T, 1000}|Acc]);
  2412. te_weight(<< "1.", R/bits >>, Trail, Acc, T) -> te_list_sep(R, Trail, [{T, 1000}|Acc]);
  2413. te_weight(<< "1", R/bits >>, Trail, Acc, T) -> te_list_sep(R, Trail, [{T, 1000}|Acc]);
  2414. te_weight(<< "0.", A, B, C, R/bits >>, Trail, Acc, T) when ?IS_DIGIT(A), ?IS_DIGIT(B), ?IS_DIGIT(C) ->
  2415. te_list_sep(R, Trail, [{T, (A - $0) * 100 + (B - $0) * 10 + (C - $0)}|Acc]);
  2416. te_weight(<< "0.", A, B, R/bits >>, Trail, Acc, T) when ?IS_DIGIT(A), ?IS_DIGIT(B) ->
  2417. te_list_sep(R, Trail, [{T, (A - $0) * 100 + (B - $0) * 10}|Acc]);
  2418. te_weight(<< "0.", A, R/bits >>, Trail, Acc, T) when ?IS_DIGIT(A) ->
  2419. te_list_sep(R, Trail, [{T, (A - $0) * 100}|Acc]);
  2420. te_weight(<< "0.", R/bits >>, Trail, Acc, T) -> te_list_sep(R, Trail, [{T, 0}|Acc]);
  2421. te_weight(<< "0", R/bits >>, Trail, Acc, T) -> te_list_sep(R, Trail, [{T, 0}|Acc]).
  2422. te_list_sep(<<>>, Trail, Acc) -> {Trail, lists:reverse(Acc)};
  2423. te_list_sep(<< C, R/bits >>, Trail, Acc) when ?IS_WS(C) -> te_list_sep(R, Trail, Acc);
  2424. te_list_sep(<< $,, R/bits >>, Trail, Acc) -> te_list(R, Trail, Acc).
  2425. -ifdef(TEST).
  2426. te() ->
  2427. ?LET({Trail, L},
  2428. {elements([trailers, no_trailers]),
  2429. small_non_empty_list({?SUCHTHAT(T, token(), T =/= <<"trailers">>), weight()})},
  2430. {Trail, L, begin
  2431. L2 = case Trail of
  2432. no_trailers -> L;
  2433. trailers ->
  2434. Rand = random:uniform(length(L) + 1) - 1,
  2435. {Before, After} = lists:split(Rand, L),
  2436. Before ++ [{<<"trailers">>, undefined}|After]
  2437. end,
  2438. << _, TE/binary >> = iolist_to_binary([case W of
  2439. undefined -> [$,, T];
  2440. _ -> [$,, T, <<";q=">>, qvalue_to_iodata(W)]
  2441. end || {T, W} <- L2]),
  2442. TE
  2443. end}
  2444. ).
  2445. prop_parse_te() ->
  2446. random:seed(os:timestamp()),
  2447. ?FORALL({Trail, L, TE},
  2448. te(),
  2449. begin
  2450. {ResTrail, ResL} = parse_te(TE),
  2451. CheckedL = [begin
  2452. ResT =:= ?LOWER(T)
  2453. andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
  2454. end || {{T, W}, {ResT, ResW}} <- lists:zip(L, ResL)],
  2455. ResTrail =:= Trail andalso [true] =:= lists:usort(CheckedL)
  2456. end).
  2457. parse_te_test_() ->
  2458. Tests = [
  2459. {<<"deflate">>, {no_trailers, [{<<"deflate">>, 1000}]}},
  2460. {<<>>, {no_trailers, []}},
  2461. {<<"trailers, deflate;q=0.5">>, {trailers, [{<<"deflate">>, 500}]}}
  2462. ],
  2463. [{V, fun() -> R = parse_te(V) end} || {V, R} <- Tests].
  2464. horse_parse_te() ->
  2465. horse:repeat(200000,
  2466. parse_te(<<"trailers, deflate;q=0.5">>)
  2467. ).
  2468. -endif.
  2469. %% @doc Parse the Trailer header.
  2470. -spec parse_trailer(binary()) -> [binary()].
  2471. parse_trailer(Trailer) ->
  2472. nonempty(token_ci_list(Trailer, [])).
  2473. -ifdef(TEST).
  2474. parse_trailer_test_() ->
  2475. Tests = [
  2476. {<<"Date, Content-MD5">>, [<<"date">>, <<"content-md5">>]}
  2477. ],
  2478. [{V, fun() -> R = parse_trailer(V) end} || {V, R} <- Tests].
  2479. parse_trailer_error_test_() ->
  2480. Tests = [
  2481. <<>>
  2482. ],
  2483. [{V, fun() -> {'EXIT', _} = (catch parse_trailer(V)) end} || V <- Tests].
  2484. horse_parse_trailer() ->
  2485. horse:repeat(200000,
  2486. parse_trailer(<<"Date, Content-MD5">>)
  2487. ).
  2488. -endif.
  2489. %% @doc Parse the Transfer-Encoding header.
  2490. %%
  2491. %% This function does not support parsing of transfer-parameter.
  2492. -spec parse_transfer_encoding(binary()) -> [binary()].
  2493. parse_transfer_encoding(<<"chunked">>) ->
  2494. [<<"chunked">>];
  2495. parse_transfer_encoding(TransferEncoding) ->
  2496. nonempty(token_ci_list(TransferEncoding, [])).
  2497. -ifdef(TEST).
  2498. prop_parse_transfer_encoding() ->
  2499. ?FORALL(L,
  2500. non_empty(list(token())),
  2501. begin
  2502. << _, TransferEncoding/binary >> = iolist_to_binary([[$,, C] || C <- L]),
  2503. ResL = parse_transfer_encoding(TransferEncoding),
  2504. CheckedL = [?LOWER(Co) =:= ResC || {Co, ResC} <- lists:zip(L, ResL)],
  2505. [true] =:= lists:usort(CheckedL)
  2506. end).
  2507. parse_transfer_encoding_test_() ->
  2508. Tests = [
  2509. {<<"a , , , ">>, [<<"a">>]},
  2510. {<<" , , , a">>, [<<"a">>]},
  2511. {<<"a , , b">>, [<<"a">>, <<"b">>]},
  2512. {<<"chunked">>, [<<"chunked">>]},
  2513. {<<"chunked, something">>, [<<"chunked">>, <<"something">>]},
  2514. {<<"gzip, chunked">>, [<<"gzip">>, <<"chunked">>]}
  2515. ],
  2516. [{V, fun() -> R = parse_transfer_encoding(V) end} || {V, R} <- Tests].
  2517. parse_transfer_encoding_error_test_() ->
  2518. Tests = [
  2519. <<>>,
  2520. <<" ">>,
  2521. <<" , ">>,
  2522. <<",,,">>,
  2523. <<"a b">>
  2524. ],
  2525. [{V, fun() -> {'EXIT', _} = (catch parse_transfer_encoding(V)) end}
  2526. || V <- Tests].
  2527. horse_parse_transfer_encoding_chunked() ->
  2528. horse:repeat(200000,
  2529. parse_transfer_encoding(<<"chunked">>)
  2530. ).
  2531. horse_parse_transfer_encoding_custom() ->
  2532. horse:repeat(200000,
  2533. parse_transfer_encoding(<<"chunked, something">>)
  2534. ).
  2535. -endif.
  2536. %% @doc Parse the Upgrade header.
  2537. %%
  2538. %% It is unclear from the RFC whether the values here are
  2539. %% case sensitive.
  2540. %%
  2541. %% We handle them in a case insensitive manner because they
  2542. %% are described as case insensitive in the Websocket RFC.
  2543. -spec parse_upgrade(binary()) -> [binary()].
  2544. parse_upgrade(Upgrade) ->
  2545. nonempty(protocol_list(Upgrade, [])).
  2546. protocol_list(<<>>, Acc) -> lists:reverse(Acc);
  2547. protocol_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> protocol_list(R, Acc);
  2548. protocol_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) ->
  2549. ?LOWER(protocol_name, R, Acc, <<>>).
  2550. protocol_name(<< $/, C, R/bits >>, Acc, P) ->
  2551. ?LOWER(protocol_version, R, Acc, << P/binary, $/ >>);
  2552. protocol_name(<< C, R/bits >>, Acc, P) when ?IS_TOKEN(C) ->
  2553. ?LOWER(protocol_name, R, Acc, P);
  2554. protocol_name(R, Acc, P) -> protocol_list_sep(R, [P|Acc]).
  2555. protocol_version(<< C, R/bits >>, Acc, P) when ?IS_TOKEN(C) ->
  2556. ?LOWER(protocol_version, R, Acc, P);
  2557. protocol_version(R, Acc, P) -> protocol_list_sep(R, [P|Acc]).
  2558. protocol_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  2559. protocol_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> protocol_list_sep(R, Acc);
  2560. protocol_list_sep(<< $,, R/bits >>, Acc) -> protocol_list(R, Acc).
  2561. -ifdef(TEST).
  2562. protocols() ->
  2563. ?LET(P,
  2564. oneof([token(), [token(), $/, token()]]),
  2565. iolist_to_binary(P)).
  2566. prop_parse_upgrade() ->
  2567. ?FORALL(L,
  2568. non_empty(list(protocols())),
  2569. begin
  2570. << _, Upgrade/binary >> = iolist_to_binary([[$,, P] || P <- L]),
  2571. ResL = parse_upgrade(Upgrade),
  2572. CheckedL = [?LOWER(P) =:= ResP || {P, ResP} <- lists:zip(L, ResL)],
  2573. [true] =:= lists:usort(CheckedL)
  2574. end).
  2575. parse_upgrade_test_() ->
  2576. Tests = [
  2577. {<<"HTTP/2.0, SHTTP/1.3, IRC/6.9, RTA/x11">>,
  2578. [<<"http/2.0">>, <<"shttp/1.3">>, <<"irc/6.9">>, <<"rta/x11">>]},
  2579. {<<"HTTP/2.0">>, [<<"http/2.0">>]}
  2580. ],
  2581. [{V, fun() -> R = parse_upgrade(V) end} || {V, R} <- Tests].
  2582. parse_upgrade_error_test_() ->
  2583. Tests = [
  2584. <<>>
  2585. ],
  2586. [{V, fun() -> {'EXIT', _} = (catch parse_upgrade(V)) end}
  2587. || V <- Tests].
  2588. -endif.
  2589. %% @doc Parse the Vary header.
  2590. -spec parse_vary(binary()) -> '*' | [binary()].
  2591. parse_vary(<<"*">>) ->
  2592. '*';
  2593. parse_vary(Vary) ->
  2594. nonempty(token_ci_list(Vary, [])).
  2595. -ifdef(TEST).
  2596. parse_vary_test_() ->
  2597. Tests = [
  2598. {<<"*">>, '*'},
  2599. {<<"Accept-Encoding">>, [<<"accept-encoding">>]},
  2600. {<<"accept-encoding, accept-language">>, [<<"accept-encoding">>, <<"accept-language">>]}
  2601. ],
  2602. [{V, fun() -> R = parse_vary(V) end} || {V, R} <- Tests].
  2603. parse_vary_error_test_() ->
  2604. Tests = [
  2605. <<>>
  2606. ],
  2607. [{V, fun() -> {'EXIT', _} = (catch parse_vary(V)) end} || V <- Tests].
  2608. -endif.
  2609. %% @doc Parse the WWW-Authenticate header.
  2610. %%
  2611. %% Unknown schemes are represented as the lowercase binary
  2612. %% instead of an atom. Unlike with parse_authorization/1,
  2613. %% we do not crash on unknown schemes.
  2614. %%
  2615. %% When parsing auth-params, we do not accept BWS characters around the "=".
  2616. -spec parse_www_authenticate(binary()) -> [{basic, binary()}
  2617. | {bearer | digest | binary(), [{binary(), binary()}]}].
  2618. parse_www_authenticate(Authenticate) ->
  2619. nonempty(www_auth_list(Authenticate, [])).
  2620. www_auth_list(<<>>, Acc) -> lists:reverse(Acc);
  2621. www_auth_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> www_auth_list(R, Acc);
  2622. www_auth_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) ->
  2623. ?LOWER(www_auth_scheme, R, Acc, <<>>).
  2624. www_auth_basic_before_realm(<< C, R/bits >>, Acc) when ?IS_WS(C) -> www_auth_basic_before_realm(R, Acc);
  2625. www_auth_basic_before_realm(<< "realm=\"", R/bits >>, Acc) -> www_auth_basic(R, Acc, <<>>).
  2626. www_auth_basic(<< $", R/bits >>, Acc, Realm) -> www_auth_list_sep(R, [{basic, Realm}|Acc]);
  2627. www_auth_basic(<< $\\, C, R/bits >>, Acc, Realm) when ?IS_VCHAR_OBS(C) -> www_auth_basic(R, Acc, << Realm/binary, C >>);
  2628. www_auth_basic(<< C, R/bits >>, Acc, Realm) when ?IS_VCHAR_OBS(C) -> www_auth_basic(R, Acc, << Realm/binary, C >>).
  2629. www_auth_scheme(<< C, R/bits >>, Acc, Scheme) when ?IS_WS(C) ->
  2630. case Scheme of
  2631. <<"basic">> -> www_auth_basic_before_realm(R, Acc);
  2632. <<"bearer">> -> www_auth_params_list(R, Acc, bearer, []);
  2633. <<"digest">> -> www_auth_params_list(R, Acc, digest, []);
  2634. _ -> www_auth_params_list(R, Acc, Scheme, [])
  2635. end;
  2636. www_auth_scheme(<< C, R/bits >>, Acc, Scheme) when ?IS_TOKEN(C) ->
  2637. ?LOWER(www_auth_scheme, R, Acc, Scheme).
  2638. www_auth_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  2639. www_auth_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> www_auth_list_sep(R, Acc);
  2640. www_auth_list_sep(<< $,, R/bits >>, Acc) -> www_auth_list(R, Acc).
  2641. www_auth_params_list(<<>>, Acc, Scheme, Params) ->
  2642. lists:reverse([{Scheme, lists:reverse(nonempty(Params))}|Acc]);
  2643. www_auth_params_list(<< C, R/bits >>, Acc, Scheme, Params) when ?IS_WS_COMMA(C) ->
  2644. www_auth_params_list(R, Acc, Scheme, Params);
  2645. www_auth_params_list(<< "algorithm=", C, R/bits >>, Acc, Scheme, Params) when ?IS_TOKEN(C) ->
  2646. www_auth_token(R, Acc, Scheme, Params, <<"algorithm">>, << C >>);
  2647. www_auth_params_list(<< "domain=\"", R/bits >>, Acc, Scheme, Params) ->
  2648. www_auth_quoted(R, Acc, Scheme, Params, <<"domain">>, <<>>);
  2649. www_auth_params_list(<< "error=\"", R/bits >>, Acc, Scheme, Params) ->
  2650. www_auth_quoted(R, Acc, Scheme, Params, <<"error">>, <<>>);
  2651. www_auth_params_list(<< "error_description=\"", R/bits >>, Acc, Scheme, Params) ->
  2652. www_auth_quoted(R, Acc, Scheme, Params, <<"error_description">>, <<>>);
  2653. www_auth_params_list(<< "error_uri=\"", R/bits >>, Acc, Scheme, Params) ->
  2654. www_auth_quoted(R, Acc, Scheme, Params, <<"error_uri">>, <<>>);
  2655. www_auth_params_list(<< "nonce=\"", R/bits >>, Acc, Scheme, Params) ->
  2656. www_auth_quoted(R, Acc, Scheme, Params, <<"nonce">>, <<>>);
  2657. www_auth_params_list(<< "opaque=\"", R/bits >>, Acc, Scheme, Params) ->
  2658. www_auth_quoted(R, Acc, Scheme, Params, <<"opaque">>, <<>>);
  2659. www_auth_params_list(<< "qop=\"", R/bits >>, Acc, Scheme, Params) ->
  2660. www_auth_quoted(R, Acc, Scheme, Params, <<"qop">>, <<>>);
  2661. www_auth_params_list(<< "realm=\"", R/bits >>, Acc, Scheme, Params) ->
  2662. www_auth_quoted(R, Acc, Scheme, Params, <<"realm">>, <<>>);
  2663. www_auth_params_list(<< "scope=\"", R/bits >>, Acc, Scheme, Params) ->
  2664. www_auth_quoted(R, Acc, Scheme, Params, <<"scope">>, <<>>);
  2665. www_auth_params_list(<< "stale=false", R/bits >>, Acc, Scheme, Params) ->
  2666. www_auth_params_list_sep(R, Acc, Scheme, [{<<"stale">>, <<"false">>}|Params]);
  2667. www_auth_params_list(<< "stale=true", R/bits >>, Acc, Scheme, Params) ->
  2668. www_auth_params_list_sep(R, Acc, Scheme, [{<<"stale">>, <<"true">>}|Params]);
  2669. www_auth_params_list(<< C, R/bits >>, Acc, Scheme, Params) when ?IS_TOKEN(C) ->
  2670. ?LOWER(www_auth_param, R, Acc, Scheme, Params, <<>>).
  2671. www_auth_param(<< $=, $", R/bits >>, Acc, Scheme, Params, K) ->
  2672. www_auth_quoted(R, Acc, Scheme, Params, K, <<>>);
  2673. www_auth_param(<< $=, C, R/bits >>, Acc, Scheme, Params, K) when ?IS_TOKEN(C) ->
  2674. www_auth_token(R, Acc, Scheme, Params, K, << C >>);
  2675. www_auth_param(<< C, R/bits >>, Acc, Scheme, Params, K) when ?IS_TOKEN(C) ->
  2676. ?LOWER(www_auth_param, R, Acc, Scheme, Params, K);
  2677. www_auth_param(R, Acc, Scheme, Params, NewScheme) ->
  2678. www_auth_scheme(R, [{Scheme, lists:reverse(Params)}|Acc], NewScheme).
  2679. www_auth_token(<< C, R/bits >>, Acc, Scheme, Params, K, V) when ?IS_TOKEN(C) ->
  2680. www_auth_token(R, Acc, Scheme, Params, K, << V/binary, C >>);
  2681. www_auth_token(R, Acc, Scheme, Params, K, V) ->
  2682. www_auth_params_list_sep(R, Acc, Scheme, [{K, V}|Params]).
  2683. www_auth_quoted(<< $", R/bits >>, Acc, Scheme, Params, K, V) ->
  2684. www_auth_params_list_sep(R, Acc, Scheme, [{K, V}|Params]);
  2685. www_auth_quoted(<< $\\, C, R/bits >>, Acc, Scheme, Params, K, V) when ?IS_VCHAR_OBS(C) ->
  2686. www_auth_quoted(R, Acc, Scheme, Params, K, << V/binary, C >>);
  2687. www_auth_quoted(<< C, R/bits >>, Acc, Scheme, Params, K, V) when ?IS_VCHAR_OBS(C) ->
  2688. www_auth_quoted(R, Acc, Scheme, Params, K, << V/binary, C >>).
  2689. www_auth_params_list_sep(<<>>, Acc, Scheme, Params) ->
  2690. lists:reverse([{Scheme, lists:reverse(Params)}|Acc]);
  2691. www_auth_params_list_sep(<< C, R/bits >>, Acc, Scheme, Params) when ?IS_WS(C) ->
  2692. www_auth_params_list_sep(R, Acc, Scheme, Params);
  2693. www_auth_params_list_sep(<< $,, R/bits >>, Acc, Scheme, Params) ->
  2694. www_auth_params_list_after_sep(R, Acc, Scheme, Params).
  2695. www_auth_params_list_after_sep(<<>>, Acc, Scheme, Params) ->
  2696. lists:reverse([{Scheme, lists:reverse(Params)}|Acc]);
  2697. www_auth_params_list_after_sep(<< C, R/bits >>, Acc, Scheme, Params) when ?IS_WS_COMMA(C) ->
  2698. www_auth_params_list_after_sep(R, Acc, Scheme, Params);
  2699. www_auth_params_list_after_sep(R, Acc, Scheme, Params) ->
  2700. www_auth_params_list(R, Acc, Scheme, Params).
  2701. -ifdef(TEST).
  2702. parse_www_authenticate_test_() ->
  2703. Tests = [
  2704. {<<"Newauth realm=\"apps\", type=1, title=\"Login to \\\"apps\\\"\", Basic realm=\"simple\"">>,
  2705. [{<<"newauth">>, [
  2706. {<<"realm">>, <<"apps">>},
  2707. {<<"type">>, <<"1">>},
  2708. {<<"title">>, <<"Login to \"apps\"">>}]},
  2709. {basic, <<"simple">>}]},
  2710. %% Same test, different order.
  2711. {<<"Basic realm=\"simple\", Newauth realm=\"apps\", type=1, title=\"Login to \\\"apps\\\"\"">>,
  2712. [{basic, <<"simple">>},
  2713. {<<"newauth">>, [
  2714. {<<"realm">>, <<"apps">>},
  2715. {<<"type">>, <<"1">>},
  2716. {<<"title">>, <<"Login to \"apps\"">>}]}]},
  2717. {<<"Bearer realm=\"example\"">>,
  2718. [{bearer, [{<<"realm">>, <<"example">>}]}]},
  2719. {<<"Bearer realm=\"example\", error=\"invalid_token\", error_description=\"The access token expired\"">>,
  2720. [{bearer, [
  2721. {<<"realm">>, <<"example">>},
  2722. {<<"error">>, <<"invalid_token">>},
  2723. {<<"error_description">>, <<"The access token expired">>}
  2724. ]}]},
  2725. {<<"Basic realm=\"WallyWorld\"">>,
  2726. [{basic, <<"WallyWorld">>}]},
  2727. {<<"Digest realm=\"testrealm@host.com\", qop=\"auth,auth-int\", "
  2728. "nonce=\"dcd98b7102dd2f0e8b11d0f600bfb0c093\", "
  2729. "opaque=\"5ccc069c403ebaf9f0171e9517f40e41\"">>,
  2730. [{digest, [
  2731. {<<"realm">>, <<"testrealm@host.com">>},
  2732. {<<"qop">>, <<"auth,auth-int">>},
  2733. {<<"nonce">>, <<"dcd98b7102dd2f0e8b11d0f600bfb0c093">>},
  2734. {<<"opaque">>, <<"5ccc069c403ebaf9f0171e9517f40e41">>}
  2735. ]}]}
  2736. ],
  2737. [{V, fun() -> R = parse_www_authenticate(V) end} || {V, R} <- Tests].
  2738. parse_www_authenticate_error_test_() ->
  2739. Tests = [
  2740. <<>>
  2741. ],
  2742. [{V, fun() -> {'EXIT', _} = (catch parse_www_authenticate(V)) end} || V <- Tests].
  2743. horse_parse_www_authenticate() ->
  2744. horse:repeat(200000,
  2745. parse_www_authenticate(<<"Newauth realm=\"apps\", type=1, title=\"Login to \\\"apps\\\"\", Basic realm=\"simple\"">>)
  2746. ).
  2747. -endif.
  2748. %% @doc Parse the X-Forwarded-For header.
  2749. %%
  2750. %% This header has no specification but *looks like* it is
  2751. %% a list of tokens.
  2752. %%
  2753. %% This header is deprecated in favor of the Forwarded header.
  2754. -spec parse_x_forwarded_for(binary()) -> [binary()].
  2755. parse_x_forwarded_for(XForwardedFor) ->
  2756. nonempty(token_list(XForwardedFor, [])).
  2757. -ifdef(TEST).
  2758. parse_x_forwarded_for_test_() ->
  2759. Tests = [
  2760. {<<"client, proxy1, proxy2">>, [<<"client">>, <<"proxy1">>, <<"proxy2">>]},
  2761. {<<"128.138.243.150, unknown, 192.52.106.30">>, [<<"128.138.243.150">>, <<"unknown">>, <<"192.52.106.30">>]}
  2762. ],
  2763. [{V, fun() -> R = parse_x_forwarded_for(V) end} || {V, R} <- Tests].
  2764. parse_x_forwarded_for_error_test_() ->
  2765. Tests = [
  2766. <<>>
  2767. ],
  2768. [{V, fun() -> {'EXIT', _} = (catch parse_x_forwarded_for(V)) end} || V <- Tests].
  2769. -endif.
  2770. %% Building.
  2771. %% @doc Build the Access-Control-Allow-Credentials header.
  2772. -spec access_control_allow_credentials() -> iodata().
  2773. access_control_allow_credentials() -> <<"true">>.
  2774. %% @doc Build the Access-Control-Allow-Headers header.
  2775. -spec access_control_allow_headers([binary()]) -> iodata().
  2776. access_control_allow_headers(Headers) ->
  2777. join_token_list(nonempty(Headers)).
  2778. -ifdef(TEST).
  2779. access_control_allow_headers_test_() ->
  2780. Tests = [
  2781. {[<<"accept">>], <<"accept">>},
  2782. {[<<"accept">>, <<"authorization">>, <<"content-type">>], <<"accept, authorization, content-type">>}
  2783. ],
  2784. [{lists:flatten(io_lib:format("~p", [V])),
  2785. fun() -> R = iolist_to_binary(access_control_allow_headers(V)) end} || {V, R} <- Tests].
  2786. access_control_allow_headers_error_test_() ->
  2787. Tests = [
  2788. []
  2789. ],
  2790. [{lists:flatten(io_lib:format("~p", [V])),
  2791. fun() -> {'EXIT', _} = (catch access_control_allow_headers(V)) end} || V <- Tests].
  2792. horse_access_control_allow_headers() ->
  2793. horse:repeat(200000,
  2794. access_control_allow_headers([<<"accept">>, <<"authorization">>, <<"content-type">>])
  2795. ).
  2796. -endif.
  2797. %% @doc Build the Access-Control-Allow-Methods header.
  2798. -spec access_control_allow_methods([binary()]) -> iodata().
  2799. access_control_allow_methods(Methods) ->
  2800. join_token_list(nonempty(Methods)).
  2801. -ifdef(TEST).
  2802. access_control_allow_methods_test_() ->
  2803. Tests = [
  2804. {[<<"GET">>], <<"GET">>},
  2805. {[<<"GET">>, <<"POST">>, <<"DELETE">>], <<"GET, POST, DELETE">>}
  2806. ],
  2807. [{lists:flatten(io_lib:format("~p", [V])),
  2808. fun() -> R = iolist_to_binary(access_control_allow_methods(V)) end} || {V, R} <- Tests].
  2809. access_control_allow_methods_error_test_() ->
  2810. Tests = [
  2811. []
  2812. ],
  2813. [{lists:flatten(io_lib:format("~p", [V])),
  2814. fun() -> {'EXIT', _} = (catch access_control_allow_methods(V)) end} || V <- Tests].
  2815. horse_access_control_allow_methods() ->
  2816. horse:repeat(200000,
  2817. access_control_allow_methods([<<"GET">>, <<"POST">>, <<"DELETE">>])
  2818. ).
  2819. -endif.
  2820. %% @doc Build the Access-Control-Allow-Origin header.
  2821. -spec access_control_allow_origin({binary(), binary(), 0..65535} | reference() | '*') -> iodata().
  2822. access_control_allow_origin({Scheme, Host, Port}) ->
  2823. case default_port(Scheme) of
  2824. Port -> [Scheme, <<"://">>, Host];
  2825. _ -> [Scheme, <<"://">>, Host, <<":">>, integer_to_binary(Port)]
  2826. end;
  2827. access_control_allow_origin('*') -> <<$*>>;
  2828. access_control_allow_origin(Ref) when is_reference(Ref) -> <<"null">>.
  2829. -ifdef(TEST).
  2830. access_control_allow_origin_test_() ->
  2831. Tests = [
  2832. {{<<"http">>, <<"www.example.org">>, 8080}, <<"http://www.example.org:8080">>},
  2833. {{<<"http">>, <<"www.example.org">>, 80}, <<"http://www.example.org">>},
  2834. {{<<"http">>, <<"192.0.2.1">>, 8080}, <<"http://192.0.2.1:8080">>},
  2835. {{<<"http">>, <<"192.0.2.1">>, 80}, <<"http://192.0.2.1">>},
  2836. {{<<"http">>, <<"[2001:db8::1]">>, 8080}, <<"http://[2001:db8::1]:8080">>},
  2837. {{<<"http">>, <<"[2001:db8::1]">>, 80}, <<"http://[2001:db8::1]">>},
  2838. {{<<"http">>, <<"[::ffff:192.0.2.1]">>, 8080}, <<"http://[::ffff:192.0.2.1]:8080">>},
  2839. {{<<"http">>, <<"[::ffff:192.0.2.1]">>, 80}, <<"http://[::ffff:192.0.2.1]">>},
  2840. {make_ref(), <<"null">>},
  2841. {'*', <<$*>>}
  2842. ],
  2843. [{lists:flatten(io_lib:format("~p", [V])),
  2844. fun() -> R = iolist_to_binary(access_control_allow_origin(V)) end} || {V, R} <- Tests].
  2845. horse_access_control_allow_origin() ->
  2846. horse:repeat(200000,
  2847. access_control_allow_origin({<<"http">>, <<"example.org">>, 8080})
  2848. ).
  2849. -endif.
  2850. %% @doc Build the Access-Control-Expose-Headers header.
  2851. -spec access_control_expose_headers([binary()]) -> iodata().
  2852. access_control_expose_headers(Headers) ->
  2853. join_token_list(nonempty(Headers)).
  2854. -ifdef(TEST).
  2855. access_control_expose_headers_test_() ->
  2856. Tests = [
  2857. {[<<"accept">>], <<"accept">>},
  2858. {[<<"accept">>, <<"authorization">>, <<"content-type">>], <<"accept, authorization, content-type">>}
  2859. ],
  2860. [{lists:flatten(io_lib:format("~p", [V])),
  2861. fun() -> R = iolist_to_binary(access_control_expose_headers(V)) end} || {V, R} <- Tests].
  2862. access_control_expose_headers_error_test_() ->
  2863. Tests = [
  2864. []
  2865. ],
  2866. [{lists:flatten(io_lib:format("~p", [V])),
  2867. fun() -> {'EXIT', _} = (catch access_control_expose_headers(V)) end} || V <- Tests].
  2868. horse_access_control_expose_headers() ->
  2869. horse:repeat(200000,
  2870. access_control_expose_headers([<<"accept">>, <<"authorization">>, <<"content-type">>])
  2871. ).
  2872. -endif.
  2873. %% @doc Build the Access-Control-Max-Age header.
  2874. -spec access_control_max_age(non_neg_integer()) -> iodata().
  2875. access_control_max_age(MaxAge) -> integer_to_binary(MaxAge).
  2876. -ifdef(TEST).
  2877. access_control_max_age_test_() ->
  2878. Tests = [
  2879. {0, <<"0">>},
  2880. {42, <<"42">>},
  2881. {69, <<"69">>},
  2882. {1337, <<"1337">>},
  2883. {3495, <<"3495">>},
  2884. {1234567890, <<"1234567890">>}
  2885. ],
  2886. [{V, fun() -> R = access_control_max_age(V) end} || {V, R} <- Tests].
  2887. -endif.
  2888. %% Internal.
  2889. %% Only return if the list is not empty.
  2890. nonempty(L) when L =/= [] -> L.
  2891. %% Parse a list of case sensitive tokens.
  2892. token_list(<<>>, Acc) -> lists:reverse(Acc);
  2893. token_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> token_list(R, Acc);
  2894. token_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) -> token(R, Acc, << C >>).
  2895. token(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) -> token(R, Acc, << T/binary, C >>);
  2896. token(R, Acc, T) -> token_list_sep(R, [T|Acc]).
  2897. token_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  2898. token_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> token_list_sep(R, Acc);
  2899. token_list_sep(<< $,, R/bits >>, Acc) -> token_list(R, Acc).
  2900. %% Parse a list of case insensitive tokens.
  2901. token_ci_list(<<>>, Acc) -> lists:reverse(Acc);
  2902. token_ci_list(<< C, R/bits >>, Acc) when ?IS_WS_COMMA(C) -> token_ci_list(R, Acc);
  2903. token_ci_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) -> ?LOWER(token_ci, R, Acc, <<>>).
  2904. token_ci(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) -> ?LOWER(token_ci, R, Acc, T);
  2905. token_ci(R, Acc, T) -> token_ci_list_sep(R, [T|Acc]).
  2906. token_ci_list_sep(<<>>, Acc) -> lists:reverse(Acc);
  2907. token_ci_list_sep(<< C, R/bits >>, Acc) when ?IS_WS(C) -> token_ci_list_sep(R, Acc);
  2908. token_ci_list_sep(<< $,, R/bits >>, Acc) -> token_ci_list(R, Acc).
  2909. join_token_list([]) -> [];
  2910. join_token_list([H|T]) -> join_token_list(T, [H]).
  2911. join_token_list([], Acc) -> lists:reverse(Acc);
  2912. join_token_list([H|T], Acc) -> join_token_list(T, [H,<<", ">>|Acc]).