| % Licensed under the Apache License, Version 2.0 (the "License"); you may not |
| % use this file except in compliance with the License. You may obtain a copy of |
| % the License at |
| % |
| % http://www.apache.org/licenses/LICENSE-2.0 |
| % |
| % Unless required by applicable law or agreed to in writing, software |
| % distributed under the License is distributed on an "AS IS" BASIS, WITHOUT |
| % WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the |
| % License for the specific language governing permissions and limitations under |
| % the License. |
| |
| -module(couch_replicator_httpc). |
| |
| -include_lib("couch/include/couch_db.hrl"). |
| -include_lib("ibrowse/include/ibrowse.hrl"). |
| -include_lib("couch_replicator/include/couch_replicator_api_wrap.hrl"). |
| |
| -export([setup/1]). |
| -export([send_req/3]). |
| -export([stop_http_worker/0]). |
| -export([full_url/2]). |
| |
| -import(couch_util, [ |
| get_value/2, |
| get_value/3 |
| ]). |
| |
| -define(replace(L, K, V), lists:keystore(K, 1, L, {K, V})). |
| -define(MAX_WAIT, 5 * 60 * 1000). |
| -define(STREAM_STATUS, ibrowse_stream_status). |
| -define(STOP_HTTP_WORKER, stop_http_worker). |
| |
| % This limit is for the number of messages we're willing to discard |
| % from an HTTP stream in clean_mailbox/1 before killing the worker |
| % and returning. The original intent for clean_mailbox was to remove |
| % a single message or two if the changes feed returned before fully |
| % consuming the request. This threshold gives us confidence we'll |
| % continue to properly close changes feeds while avoiding any case |
| % where we may end up processing an unbounded number of messages. |
| -define(MAX_DISCARDED_MESSAGES, 16). |
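| |
| % Illustrative usage sketch (hypothetical; `Db0` stands for an #httpdb{} |
| % record already populated by the caller): setup/1 starts the connection |
| % pool and initializes the auth plugin, then send_req/3 issues a request |
| % and hands the decoded response to the callback: |
| % |
| %     {ok, Db} = couch_replicator_httpc:setup(Db0), |
| %     couch_replicator_httpc:send_req( |
| %         Db, |
| %         [{method, get}, {path, "_all_docs"}, {qs, [{"limit", "1"}]}], |
| %         fun(Code, _Headers, EJson) -> {Code, EJson} end |
| %     ). |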
| |
| setup(Db) -> |
| #httpdb{ |
| httpc_pool = nil, |
| url = Url, |
| http_connections = MaxConns, |
| proxy_url = ProxyUrl |
| } = Db, |
| {ok, Pid} = couch_replicator_httpc_pool:start_link( |
| Url, |
| ProxyUrl, |
| [{max_connections, MaxConns}] |
| ), |
| case couch_replicator_auth:initialize(Db#httpdb{httpc_pool = Pid}) of |
| {ok, Db1} -> |
| {ok, Db1}; |
| {error, Error} -> |
| LogMsg = "~p: auth plugin initialization failed ~p ~p", |
| LogUrl = couch_util:url_strip_password(Url), |
| couch_log:error(LogMsg, [?MODULE, LogUrl, Error]), |
| throw({replication_auth_error, Error}) |
| end. |
| |
| send_req(HttpDb, Params1, Callback) -> |
| put(?STREAM_STATUS, init), |
| couch_stats:increment_counter([couch_replicator, requests]), |
| Params2 = ?replace( |
| Params1, |
| qs, |
| [{K, ?b2l(iolist_to_binary(V))} || {K, V} <- get_value(qs, Params1, [])] |
| ), |
| Params = ?replace( |
| Params2, |
| ibrowse_options, |
| lists:keysort(1, get_value(ibrowse_options, Params2, [])) |
| ), |
| {Worker, Response, HttpDb1} = send_ibrowse_req(HttpDb, Params), |
| Ret = |
| try |
| process_response(Response, Worker, HttpDb1, Params, Callback) |
| catch |
| throw:{retry, NewHttpDb0, NewParams0} -> |
| {retry, NewHttpDb0, NewParams0} |
| after |
| Pool = HttpDb1#httpdb.httpc_pool, |
| case get(?STOP_HTTP_WORKER) of |
| stop -> |
| ok = stop_and_release_worker(Pool, Worker), |
| erase(?STOP_HTTP_WORKER); |
| undefined -> |
| ok = couch_replicator_httpc_pool:release_worker(Pool, Worker) |
| end, |
| clean_mailbox(Response) |
| end, |
|     % This is necessary to keep this function tail-recursive. Calling |
|     % send_req/3 from within the catch clause would accidentally turn |
|     % it into a body-recursive call. |
| case Ret of |
| {retry, #httpdb{} = NewHttpDb, NewParams} -> |
| send_req(NewHttpDb, NewParams, Callback); |
| _ -> |
| Ret |
| end. |
| |
| stop_http_worker() -> |
| put(?STOP_HTTP_WORKER, stop). |
| |
| send_ibrowse_req(#httpdb{headers = BaseHeaders} = HttpDb0, Params) -> |
| Method = get_value(method, Params, get), |
| UserHeaders = get_value(headers, Params, []), |
| Headers1 = merge_headers(BaseHeaders, UserHeaders), |
| {Headers2, HttpDb} = couch_replicator_auth:update_headers(HttpDb0, Headers1), |
| Url = full_url(HttpDb, Params), |
| Body = get_value(body, Params, []), |
|     Timeout = |
|         case get_value(path, Params) == "_changes" of |
|             true -> |
|                 infinity; |
|             false -> |
|                 case config:get("replicator", "request_timeout", "infinity") of |
|                     "infinity" -> infinity; |
|                     Milliseconds -> list_to_integer(Milliseconds) |
|                 end |
|         end, |
| {ok, Worker} = couch_replicator_httpc_pool:get_worker(HttpDb#httpdb.httpc_pool), |
| BasicAuthOpts = |
| case couch_replicator_utils:get_basic_auth_creds(HttpDb) of |
| {undefined, undefined} -> |
| []; |
| {User, Pass} when is_list(User), is_list(Pass) -> |
| [{basic_auth, {User, Pass}}] |
| end, |
| IbrowseOptions = |
| BasicAuthOpts ++ |
| [ |
| {response_format, binary}, |
| {inactivity_timeout, HttpDb#httpdb.timeout} |
| | lists:ukeymerge( |
| 1, |
| get_value(ibrowse_options, Params, []), |
| HttpDb#httpdb.ibrowse_options |
| ) |
| ], |
| backoff_before_request(Worker, HttpDb, Params), |
| Response = ibrowse:send_req_direct( |
| Worker, Url, Headers2, Method, Body, IbrowseOptions, Timeout |
| ), |
| {Worker, Response, HttpDb}. |
| |
| %% Stop the worker and wait for it to die, then release it. Making sure it |
| %% is dead before releasing it to the pool avoids a race where the dying |
| %% worker is recycled and the next request on it returns an |
| %% {error, req_timedout} error, which is not really a timeout, just the |
| %% race condition manifesting. |
| stop_and_release_worker(Pool, Worker) -> |
| Ref = erlang:monitor(process, Worker), |
| ibrowse_http_client:stop(Worker), |
| receive |
| {'DOWN', Ref, _, _, _} -> |
| ok |
| end, |
| ok = couch_replicator_httpc_pool:release_worker_sync(Pool, Worker). |
| |
| process_response({error, sel_conn_closed}, Worker, HttpDb, Params, _Cb) -> |
| put(?STOP_HTTP_WORKER, stop), |
| maybe_retry(sel_conn_closed, Worker, HttpDb, Params); |
| %% This clause handles unexpected connection closing during pipelined |
| %% requests. For example, if the server responds to a request, sets the |
| %% Connection: close header and closes the socket, ibrowse will only detect |
| %% that error when it sends the next request. |
| process_response({error, connection_closing}, Worker, HttpDb, Params, _Cb) -> |
| put(?STOP_HTTP_WORKER, stop), |
| maybe_retry({error, connection_closing}, Worker, HttpDb, Params); |
| process_response({ibrowse_req_id, ReqId}, Worker, HttpDb, Params, Callback) -> |
| process_stream_response(ReqId, Worker, HttpDb, Params, Callback); |
| process_response({ok, Code, Headers, Body}, Worker, HttpDb, Params, Callback) -> |
| case list_to_integer(Code) of |
| R when R =:= 301; R =:= 302; R =:= 303 -> |
| backoff_success(HttpDb, Params), |
| do_redirect(Worker, R, Headers, HttpDb, Params, Callback); |
| 429 -> |
| backoff(HttpDb, Params); |
| Error when Error =:= 408; Error >= 500 -> |
| couch_stats:increment_counter([couch_replicator, responses, failure]), |
| maybe_retry({code, Error}, Worker, HttpDb, Params); |
| Ok when Ok >= 200, Ok < 500 -> |
| backoff_success(HttpDb, Params), |
| couch_stats:increment_counter([couch_replicator, responses, success]), |
| EJson = |
| case Body of |
| <<>> -> |
| null; |
| Json -> |
| ?JSON_DECODE(Json) |
| end, |
| process_auth_response(HttpDb, Ok, Headers, Params), |
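|             % A 413 response may arrive before the request body has been |
|             % fully sent, leaving the connection in an unreliable state, so |
|             % flag this worker to be stopped instead of released back to |
|             % the pool (see the ?STOP_HTTP_WORKER handling in send_req/3). |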
| if |
| Ok =:= 413 -> put(?STOP_HTTP_WORKER, stop); |
| true -> ok |
| end, |
| Callback(Ok, Headers, EJson) |
| end; |
| process_response(Error, Worker, HttpDb, Params, _Callback) -> |
| maybe_retry(Error, Worker, HttpDb, Params). |
| |
| process_stream_response(ReqId, Worker, HttpDb, Params, Callback) -> |
| receive |
| {ibrowse_async_headers, ReqId, Code, Headers} -> |
| case list_to_integer(Code) of |
| R when R =:= 301; R =:= 302; R =:= 303 -> |
| backoff_success(HttpDb, Params), |
| do_redirect(Worker, R, Headers, HttpDb, Params, Callback); |
| 429 -> |
| Timeout = couch_replicator_rate_limiter:max_interval(), |
| backoff(HttpDb#httpdb{timeout = Timeout}, Params); |
| Error when Error =:= 408; Error >= 500 -> |
| couch_stats:increment_counter( |
| [couch_replicator, stream_responses, failure] |
| ), |
| report_error(Worker, HttpDb, Params, {code, Error}); |
| Ok when Ok >= 200, Ok < 500 -> |
| backoff_success(HttpDb, Params), |
| HttpDb1 = process_auth_response(HttpDb, Ok, Headers, Params), |
| StreamDataFun = fun() -> |
| stream_data_self(HttpDb1, Params, Worker, ReqId, Callback) |
| end, |
| put(?STREAM_STATUS, {streaming, Worker}), |
| if |
| Ok =:= 413 -> put(?STOP_HTTP_WORKER, stop); |
| true -> ok |
| end, |
| ibrowse:stream_next(ReqId), |
| try |
| Ret = Callback(Ok, Headers, StreamDataFun), |
| Ret |
| catch |
| throw:{maybe_retry_req, connection_closed} -> |
| maybe_retry( |
| {connection_closed, mid_stream}, |
| Worker, |
| HttpDb1, |
| Params |
| ); |
| throw:{maybe_retry_req, Err} -> |
| maybe_retry(Err, Worker, HttpDb1, Params) |
| end |
| end; |
| {ibrowse_async_response, ReqId, {error, _} = Error} -> |
| couch_stats:increment_counter( |
| [couch_replicator, stream_responses, failure] |
| ), |
| maybe_retry(Error, Worker, HttpDb, Params) |
| after HttpDb#httpdb.timeout + 500 -> |
| % Note: ibrowse should always reply with timeouts, but this doesn't |
| % seem to be always true when there's a very high rate of requests |
| % and many open connections. |
| maybe_retry(timeout, Worker, HttpDb, Params) |
| end. |
| |
| process_auth_response(HttpDb, Code, Headers, Params) -> |
| case couch_replicator_auth:handle_response(HttpDb, Code, Headers) of |
| {continue, HttpDb1} -> |
| HttpDb1; |
| {retry, HttpDb1} -> |
| log_retry_error(Params, HttpDb1, 0, Code), |
| throw({retry, HttpDb1, Params}) |
| end. |
| |
| % Only streaming HTTP requests send messages back from |
| % the ibrowse worker process. We can detect that based |
| % on the ibrowse_req_id format. This just drops all |
| % messages for the given ReqId on the floor since we're |
| % no longer handling the HTTP request. |
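| % |
| % ?STREAM_STATUS moves through init -> {streaming, Worker} -> ended as a |
| % stream is consumed; clean_mailbox/2 uses it to decide whether a live |
| % worker may still be sending us messages. |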
| |
| clean_mailbox(ReqId) -> |
| clean_mailbox(ReqId, ?MAX_DISCARDED_MESSAGES). |
| |
| clean_mailbox(_ReqId, 0) -> |
| case get(?STREAM_STATUS) of |
| {streaming, Worker} -> |
|             % We kill workers that continue to stream us |
|             % messages after we give up, but we do *not* exit |
|             % ourselves. This is because we may be running |
|             % as an exception unwinds and we don't want to |
|             % change any of that subtle logic. |
| exit(Worker, {timeout, ibrowse_stream_cleanup}); |
| _ -> |
| ok |
| end, |
| ok; |
| clean_mailbox({ibrowse_req_id, ReqId}, Count) when Count > 0 -> |
| case get(?STREAM_STATUS) of |
| {streaming, Worker} -> |
| case is_process_alive(Worker) of |
| true -> |
| discard_message(ReqId, Worker, Count); |
| false -> |
| put(?STREAM_STATUS, ended), |
| ok |
| end; |
| Status when Status == init; Status == ended -> |
| receive |
| {ibrowse_async_response, ReqId, _} -> |
| clean_mailbox({ibrowse_req_id, ReqId}, Count - 1); |
| {ibrowse_async_response_end, ReqId} -> |
| put(?STREAM_STATUS, ended), |
| ok |
| after 0 -> |
| ok |
| end |
| end; |
| clean_mailbox(_, Count) when Count > 0 -> |
| ok. |
| |
| discard_message(ReqId, Worker, Count) -> |
| ibrowse:stream_next(ReqId), |
| receive |
| {ibrowse_async_response, ReqId, _} -> |
| clean_mailbox({ibrowse_req_id, ReqId}, Count - 1); |
| {ibrowse_async_response_end, ReqId} -> |
| put(?STREAM_STATUS, ended), |
| ok |
| after 30000 -> |
| exit(Worker, {timeout, ibrowse_stream_cleanup}), |
| exit({timeout, ibrowse_stream_cleanup}) |
| end. |
| |
| -spec maybe_retry(any(), pid(), #httpdb{}, list()) -> no_return(). |
| maybe_retry(Error, Worker, #httpdb{retries = 0} = HttpDb, Params) -> |
| report_error(Worker, HttpDb, Params, {error, Error}); |
| maybe_retry( |
| Error, |
| Worker, |
| #httpdb{retries = Retries, wait = Wait} = HttpDb, |
| Params |
| ) -> |
| case total_error_time_exceeded(HttpDb) of |
| true -> |
| report_error(Worker, HttpDb, Params, {error, Error}); |
| false -> |
| ok = timer:sleep(Wait), |
| log_retry_error(Params, HttpDb, Wait, Error), |
| Wait2 = erlang:min(Wait * 2, ?MAX_WAIT), |
| HttpDb1 = HttpDb#httpdb{retries = Retries - 1, wait = Wait2}, |
| HttpDb2 = update_first_error_timestamp(HttpDb1), |
| throw({retry, HttpDb2, Params}) |
| end. |
| |
| % When retrying, check that the total time spent retrying a request stays |
| % below the current scheduler health threshold. The goal is to not exceed |
| % the threshold; otherwise a job which keeps retrying for too long would |
| % still be considered healthy. |
| total_error_time_exceeded(#httpdb{first_error_timestamp = nil}) -> |
| false; |
| total_error_time_exceeded(#httpdb{first_error_timestamp = ErrorTimestamp}) -> |
| HealthThresholdSec = couch_replicator_scheduler:health_threshold(), |
| % Threshold value is halved because in the calling code the next step |
| % is a doubling. Not halving here could mean sleeping too long and |
| % exceeding the health threshold. |
| ThresholdUSec = (HealthThresholdSec / 2) * 1000000, |
| timer:now_diff(os:timestamp(), ErrorTimestamp) > ThresholdUSec. |
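| |
| % Worked example (illustrative; assumes a health threshold of 120 seconds): |
| % ThresholdUSec = (120 / 2) * 1000000 = 60,000,000, so a request gives up |
| % retrying once its first error is more than a minute old. |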
| |
| % Remember the first time an error occurs. This value is used later to |
| % check the total time spent retrying a request. Because retrying is |
| % recursive, on a successful result the #httpdb{} record is reset back to |
| % its original value. |
| update_first_error_timestamp(#httpdb{first_error_timestamp = nil} = HttpDb) -> |
| HttpDb#httpdb{first_error_timestamp = os:timestamp()}; |
| update_first_error_timestamp(HttpDb) -> |
| HttpDb. |
| |
| log_retry_error(Params, HttpDb, Wait, Error) -> |
| Method = string:to_upper(atom_to_list(get_value(method, Params, get))), |
| Url = couch_util:url_strip_password(full_url(HttpDb, Params)), |
| couch_log:notice( |
| "Retrying ~s request to ~s in ~p seconds due to error ~s", |
| [Method, Url, Wait / 1000, error_cause(Error)] |
| ). |
| |
| report_error(_Worker, HttpDb, Params, Error) -> |
| Method = string:to_upper(atom_to_list(get_value(method, Params, get))), |
| Url = couch_util:url_strip_password(full_url(HttpDb, Params)), |
| do_report_error(Url, Method, Error), |
| exit({http_request_failed, Method, Url, Error}). |
| |
| do_report_error(Url, Method, {code, Code}) -> |
| couch_log:error( |
| "Replicator, request ~s to ~p failed. The received " |
| "HTTP error code is ~p", |
| [Method, Url, Code] |
| ); |
| do_report_error(FullUrl, Method, Error) -> |
| couch_log:error( |
| "Replicator, request ~s to ~p failed due to error ~s", |
| [Method, FullUrl, error_cause(Error)] |
| ). |
| |
| error_cause({error, Cause}) -> |
| lists:flatten(io_lib:format("~p", [Cause])); |
| error_cause(Cause) -> |
| lists:flatten(io_lib:format("~p", [Cause])). |
| |
| stream_data_self(#httpdb{timeout = T} = HttpDb, Params, Worker, ReqId, Cb) -> |
| case accumulate_messages(ReqId, [], T + 500) of |
| {Data, ibrowse_async_response} -> |
| ibrowse:stream_next(ReqId), |
| {Data, fun() -> stream_data_self(HttpDb, Params, Worker, ReqId, Cb) end}; |
| {Data, ibrowse_async_response_end} -> |
| put(?STREAM_STATUS, ended), |
| {Data, fun() -> throw({maybe_retry_req, more_data_expected}) end} |
| end. |
| |
| accumulate_messages(ReqId, Acc, Timeout) -> |
| receive |
| {ibrowse_async_response, ReqId, {error, Error}} -> |
| throw({maybe_retry_req, Error}); |
| {ibrowse_async_response, ReqId, <<>>} -> |
| accumulate_messages(ReqId, Acc, Timeout); |
| {ibrowse_async_response, ReqId, Data} -> |
| accumulate_messages(ReqId, [Data | Acc], 0); |
| {ibrowse_async_response_end, ReqId} -> |
| {iolist_to_binary(lists:reverse(Acc)), ibrowse_async_response_end} |
| after Timeout -> |
| % Note: ibrowse should always reply with timeouts, but this doesn't |
| % seem to be always true when there's a very high rate of requests |
| % and many open connections. |
| if |
| Acc =:= [] -> |
| throw({maybe_retry_req, timeout}); |
| true -> |
| {iolist_to_binary(lists:reverse(Acc)), ibrowse_async_response} |
| end |
| end. |
| |
| full_url(#httpdb{url = BaseUrl}, Params) -> |
| Path = get_value(path, Params, []), |
| QueryArgs = get_value(qs, Params, []), |
| BaseUrl ++ Path ++ query_args_to_string(QueryArgs, []). |
| |
| query_args_to_string([], []) -> |
| ""; |
| query_args_to_string([], Acc) -> |
| "?" ++ string:join(lists:reverse(Acc), "&"); |
| query_args_to_string([{K, V} | Rest], Acc) -> |
| query_args_to_string(Rest, [K ++ "=" ++ couch_httpd:quote(V) | Acc]). |
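| |
| % Illustrative example with hypothetical values: |
| % |
| %     full_url( |
| %         #httpdb{url = "http://host:5984/db/"}, |
| %         [{path, "_changes"}, {qs, [{"feed", "normal"}, {"since", "0"}]}] |
| %     ) |
| % |
| % returns "http://host:5984/db/_changes?feed=normal&since=0"; values are |
| % URL-quoted by couch_httpd:quote/1. |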
| |
| do_redirect(_Worker, Code, Headers, #httpdb{url = Url} = HttpDb, Params, _Cb) -> |
| RedirectUrl = redirect_url(Headers, Url), |
| {HttpDb2, Params2} = after_redirect(RedirectUrl, Code, HttpDb, Params), |
| throw({retry, HttpDb2, Params2}). |
| |
| redirect_url(RespHeaders, OrigUrl) -> |
| MochiHeaders = mochiweb_headers:make(RespHeaders), |
| RedUrl = mochiweb_headers:get_value("Location", MochiHeaders), |
| #url{ |
| host = Host, |
| host_type = HostType, |
| port = Port, |
| % includes query string |
| path = Path, |
| protocol = Proto |
| } = ibrowse_lib:parse_url(RedUrl), |
| #url{ |
| username = User, |
| password = Passwd |
| } = ibrowse_lib:parse_url(OrigUrl), |
| Creds = |
| case is_list(User) andalso is_list(Passwd) of |
| true -> |
| User ++ ":" ++ Passwd ++ "@"; |
| false -> |
| [] |
| end, |
| HostPart = |
| case HostType of |
| ipv6_address -> |
| "[" ++ Host ++ "]"; |
| _ -> |
| Host |
| end, |
| atom_to_list(Proto) ++ "://" ++ Creds ++ HostPart ++ ":" ++ |
| integer_to_list(Port) ++ Path. |
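| |
| % Illustrative example (hypothetical values): a response header |
| % "Location: http://newhost:5984/db" combined with an original URL of |
| % "http://user:pass@oldhost:5984/db" produces |
| % "http://user:pass@newhost:5984/db", carrying the original credentials |
| % over to the redirect target and bracketing the host when it is an IPv6 |
| % address. |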
| |
| after_redirect(RedirectUrl, 303, HttpDb, Params) -> |
| after_redirect(RedirectUrl, HttpDb, ?replace(Params, method, get)); |
| after_redirect(RedirectUrl, _Code, HttpDb, Params) -> |
| after_redirect(RedirectUrl, HttpDb, Params). |
| |
| after_redirect(RedirectUrl, HttpDb, Params) -> |
| Params2 = lists:keydelete(path, 1, lists:keydelete(qs, 1, Params)), |
| {HttpDb#httpdb{url = RedirectUrl}, Params2}. |
| |
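| % The rate limiter tracks state per {Url, Method} key. backoff/2 records a |
| % failure (e.g. a 429 response) and throws a retry; backoff_success/2 |
| % records a success; backoff_before_request/3 sleeps for the limiter's |
| % current interval, or fails the request with max_backoff once that |
| % interval reaches the configured maximum. |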
| backoff_key(HttpDb, Params) -> |
| Method = get_value(method, Params, get), |
| Url = HttpDb#httpdb.url, |
| {Url, Method}. |
| |
| backoff(HttpDb, Params) -> |
| Key = backoff_key(HttpDb, Params), |
| couch_replicator_rate_limiter:failure(Key), |
| throw({retry, HttpDb, Params}). |
| |
| backoff_success(HttpDb, Params) -> |
| Key = backoff_key(HttpDb, Params), |
| couch_replicator_rate_limiter:success(Key). |
| |
| backoff_before_request(Worker, HttpDb, Params) -> |
| Key = backoff_key(HttpDb, Params), |
| Limit = couch_replicator_rate_limiter:max_interval(), |
| case couch_replicator_rate_limiter:interval(Key) of |
| Sleep when Sleep >= Limit -> |
| report_error(Worker, HttpDb, Params, max_backoff); |
| Sleep when Sleep >= 1 -> |
| timer:sleep(Sleep); |
| Sleep when Sleep == 0 -> |
| ok |
| end. |
| |
| merge_headers(Headers1, Headers2) when is_list(Headers1), is_list(Headers2) -> |
| Empty = mochiweb_headers:empty(), |
| Merged = mochiweb_headers:enter_from_list(Headers1 ++ Headers2, Empty), |
| mochiweb_headers:to_list(Merged). |
| |
| -ifdef(TEST). |
| |
| -include_lib("couch/include/couch_eunit.hrl"). |
| |
| merge_headers_test() -> |
| ?assertEqual([], merge_headers([], [])), |
| ?assertEqual([{"a", "x"}], merge_headers([], [{"a", "x"}])), |
| ?assertEqual([{"a", "x"}], merge_headers([{"a", "x"}], [])), |
| ?assertEqual([{"a", "y"}], merge_headers([{"A", "x"}], [{"a", "y"}])), |
| ?assertEqual( |
| [{"a", "y"}, {"B", "x"}], |
| merge_headers( |
| [{"B", "x"}], |
| [{"a", "y"}] |
| ) |
| ), |
| ?assertEqual([{"a", "y"}], merge_headers([{"A", "z"}, {"a", "y"}], [])), |
| ?assertEqual([{"a", "y"}], merge_headers([], [{"A", "z"}, {"a", "y"}])). |
| |
| -endif. |