| /* ==================================================================== |
| * The Apache Software License, Version 1.1 |
| * |
| * Copyright (c) 2000 The Apache Software Foundation. All rights |
| * reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * |
| * 1. Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * |
| * 2. Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in |
| * the documentation and/or other materials provided with the |
| * distribution. |
| * |
| * 3. The end-user documentation included with the redistribution, |
| * if any, must include the following acknowledgment: |
| * "This product includes software developed by the |
| * Apache Software Foundation (http://www.apache.org/)." |
| * Alternately, this acknowledgment may appear in the software itself, |
| * if and wherever such third-party acknowledgments normally appear. |
| * |
| * 4. The names "Apache" and "Apache Software Foundation" must |
| * not be used to endorse or promote products derived from this |
| * software without prior written permission. For written |
| * permission, please contact apache@apache.org. |
| * |
| * 5. Products derived from this software may not be called "Apache", |
| * nor may "Apache" appear in their name, without prior written |
| * permission of the Apache Software Foundation. |
| * |
| * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED |
| * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES |
| * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE |
| * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR |
| * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF |
| * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |
| * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, |
| * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT |
| * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF |
| * SUCH DAMAGE. |
| * ==================================================================== |
| * |
| * This software consists of voluntary contributions made by many |
| * individuals on behalf of the Apache Software Foundation. For more |
| * information on the Apache Software Foundation, please see |
| * <http://www.apache.org/>. |
| * |
| * Portions of this software are based upon public domain software |
| * originally written at the National Center for Supercomputing Applications, |
| * University of Illinois, Urbana-Champaign. |
| */ |
| |
| /* HTTP routines for Apache proxy */ |
| |
| #define CORE_PRIVATE |
| |
| #include "mod_proxy.h" |
| #include "apr_strings.h" |
| #include "apr_buckets.h" |
| #include "util_filter.h" |
| #include "ap_config.h" |
| #include "http_log.h" |
| #include "http_main.h" |
| #include "http_core.h" |
| #include "http_connection.h" |
| #include "util_date.h" |
| |
| /* |
| * Canonicalise http-like URLs. |
| * scheme is the scheme for the URL |
| * url is the URL starting with the first '/' |
| * def_port is the default port for this scheme. |
| */ |
| int ap_proxy_http_canon(request_rec *r, char *url, const char *scheme, int def_port) |
| { |
| char *host, *path, *search, sport[7]; |
| const char *err; |
| int port; |
| |
| /* do syntatic check. |
| * We break the URL into host, port, path, search |
| */ |
| port = def_port; |
| err = ap_proxy_canon_netloc(r->pool, &url, NULL, NULL, &host, &port); |
| if (err) |
| return HTTP_BAD_REQUEST; |
| |
| /* now parse path/search args, according to rfc1738 */ |
| /* N.B. if this isn't a true proxy request, then the URL _path_ |
| * has already been decoded. True proxy requests have r->uri |
| * == r->unparsed_uri, and no others have that property. |
| */ |
| if (r->uri == r->unparsed_uri) { |
| search = strchr(url, '?'); |
| if (search != NULL) |
| *(search++) = '\0'; |
| } |
| else |
| search = r->args; |
| |
| /* process path */ |
| path = ap_proxy_canonenc(r->pool, url, strlen(url), enc_path, r->proxyreq); |
| if (path == NULL) |
| return HTTP_BAD_REQUEST; |
| |
| if (port != def_port) |
| apr_snprintf(sport, sizeof(sport), ":%d", port); |
| else |
| sport[0] = '\0'; |
| |
| r->filename = apr_pstrcat(r->pool, "proxy:", scheme, "://", host, sport, "/", |
| path, (search) ? "?" : "", (search) ? search : "", NULL); |
| return OK; |
| } |
| |
| static const char *proxy_location_reverse_map(request_rec *r, const char *url) |
| { |
| void *sconf; |
| proxy_server_conf *conf; |
| struct proxy_alias *ent; |
| int i, l1, l2; |
| char *u; |
| |
| sconf = r->server->module_config; |
| conf = (proxy_server_conf *)ap_get_module_config(sconf, &proxy_module); |
| l1 = strlen(url); |
| ent = (struct proxy_alias *)conf->raliases->elts; |
| for (i = 0; i < conf->raliases->nelts; i++) { |
| l2 = strlen(ent[i].real); |
| if (l1 >= l2 && strncmp(ent[i].real, url, l2) == 0) { |
| u = apr_pstrcat(r->pool, ent[i].fake, &url[l2], NULL); |
| return ap_construct_url(r->pool, u, r); |
| } |
| } |
| return url; |
| } |
| |
| /* Clear all connection-based headers from the incoming headers table */ |
| static void clear_connection(apr_pool_t *p, apr_table_t *headers) |
| { |
| const char *name; |
| char *next = apr_pstrdup(p, apr_table_get(headers, "Connection")); |
| |
| apr_table_unset(headers, "Proxy-Connection"); |
| if (!next) |
| return; |
| |
| while (*next) { |
| name = next; |
| while (*next && !apr_isspace(*next) && (*next != ',')) |
| ++next; |
| while (*next && (apr_isspace(*next) || (*next == ','))) { |
| *next = '\0'; |
| ++next; |
| } |
| apr_table_unset(headers, name); |
| } |
| apr_table_unset(headers, "Connection"); |
| } |
| |
| /* |
| * This handles http:// URLs, and other URLs using a remote proxy over http |
| * If proxyhost is NULL, then contact the server directly, otherwise |
| * go via the proxy. |
| * Note that if a proxy is used, then URLs other than http: can be accessed, |
| * also, if we have trouble which is clearly specific to the proxy, then |
| * we return DECLINED so that we can try another proxy. (Or the direct |
| * route.) |
| */ |
| int ap_proxy_http_handler(request_rec *r, char *url, |
| const char *proxyhost, int proxyport) |
| { |
| const char *strp; |
| char *strp2; |
| char *desthost; |
| apr_socket_t *sock; |
| int i, len, backasswards, content_length = -1; |
| apr_status_t err; |
| apr_array_header_t *reqhdrs_arr; |
| apr_table_t *resp_hdrs = NULL; |
| apr_table_entry_t *reqhdrs; |
| struct sockaddr_in server; |
| struct in_addr destaddr; |
| char buffer[HUGE_STRING_LEN]; |
| char *buffer2; |
| char portstr[32]; |
| apr_pool_t *p = r->pool; |
| int destport = 0; |
| char *destportstr = NULL; |
| const char *urlptr = NULL; |
| apr_ssize_t cntr; |
| apr_file_t *cachefp = NULL; |
| char *buf; |
| conn_rec *origin; |
| apr_bucket *e; |
| apr_bucket_brigade *bb = apr_brigade_create(r->pool); |
| |
| void *sconf = r->server->module_config; |
| proxy_server_conf *conf = |
| (proxy_server_conf *) ap_get_module_config(sconf, &proxy_module); |
| struct noproxy_entry *npent = (struct noproxy_entry *) conf->noproxies->elts; |
| int nocache = 0; |
| |
| memset(&server, '\0', sizeof(server)); |
| server.sin_family = AF_INET; |
| |
| /* We break the URL into host, port, path-search */ |
| |
| urlptr = strstr(url, "://"); |
| if (urlptr == NULL) |
| return HTTP_BAD_REQUEST; |
| urlptr += 3; |
| destport = DEFAULT_HTTP_PORT; |
| strp = ap_strchr_c(urlptr, '/'); |
| if (strp == NULL) { |
| desthost = apr_pstrdup(p, urlptr); |
| urlptr = "/"; |
| } |
| else { |
| char *q = apr_palloc(p, strp - urlptr + 1); |
| memcpy(q, urlptr, strp - urlptr); |
| q[strp - urlptr] = '\0'; |
| urlptr = strp; |
| desthost = q; |
| } |
| |
| strp2 = ap_strchr(desthost, ':'); |
| if (strp2 != NULL) { |
| *(strp2++) = '\0'; |
| if (apr_isdigit(*strp2)) { |
| destport = atoi(strp2); |
| destportstr = strp2; |
| } |
| } |
| |
| /* check if ProxyBlock directive on this host */ |
| destaddr.s_addr = apr_inet_addr(desthost); |
| for (i = 0; i < conf->noproxies->nelts; i++) { |
| if ((npent[i].name != NULL |
| && ap_strstr_c(desthost, npent[i].name) != NULL) |
| || destaddr.s_addr == npent[i].addr.s_addr |
| || npent[i].name[0] == '*') |
| return ap_proxyerror(r, HTTP_FORBIDDEN, |
| "Connect to remote machine blocked"); |
| } |
| |
| if ((apr_socket_create(&sock, APR_INET, SOCK_STREAM, r->pool)) != APR_SUCCESS) { |
| ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, |
| "proxy: error creating socket"); |
| return HTTP_INTERNAL_SERVER_ERROR; |
| } |
| |
| #if !defined(TPF) && !defined(BEOS) |
| if (conf->recv_buffer_size > 0 && apr_setsocketopt(sock, APR_SO_RCVBUF, |
| conf->recv_buffer_size)) { |
| ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, |
| "setsockopt(SO_RCVBUF): Failed to set ProxyReceiveBufferSize, using default"); |
| } |
| #endif |
| |
| if (proxyhost != NULL) { |
| err = ap_proxy_doconnect(sock, (char *)proxyhost, proxyport, r); |
| } |
| else { |
| err = ap_proxy_doconnect(sock, (char *)desthost, destport, r); |
| } |
| |
| if (err != APR_SUCCESS) { |
| if (proxyhost != NULL) |
| return DECLINED; /* try again another way */ |
| else |
| return ap_proxyerror(r, HTTP_BAD_GATEWAY, apr_pstrcat(r->pool, |
| "Could not connect to remote machine: ", |
| desthost, NULL)); |
| } |
| |
| origin = ap_new_connection(r->pool, r->server, sock, 0); |
| if (!origin) { |
| /* the peer reset the connection already; ap_new_connection() |
| * closed the socket */ |
| /* XXX somebody that knows what they're doing add an error path */ |
| } |
| |
| ap_add_output_filter("CORE", NULL, NULL, origin); |
| |
| clear_connection(r->pool, r->headers_in); /* Strip connection-based headers */ |
| |
| buf = apr_pstrcat(r->pool, r->method, " ", proxyhost ? url : urlptr, |
| " HTTP/1.0" CRLF, NULL); |
| e = apr_bucket_pool_create(buf, strlen(buf), r->pool); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| if (destportstr != NULL && destport != DEFAULT_HTTP_PORT) { |
| buf = apr_pstrcat(r->pool, "Host: ", desthost, ":", destportstr, CRLF, NULL); |
| e = apr_bucket_pool_create(buf, strlen(buf), r->pool); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| } |
| else { |
| buf = apr_pstrcat(r->pool, "Host: ", desthost, CRLF, NULL); |
| e = apr_bucket_pool_create(buf, strlen(buf), r->pool); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| } |
| |
| if (conf->viaopt == via_block) { |
| /* Block all outgoing Via: headers */ |
| apr_table_unset(r->headers_in, "Via"); |
| } else if (conf->viaopt != via_off) { |
| /* Create a "Via:" request header entry and merge it */ |
| i = ap_get_server_port(r); |
| if (ap_is_default_port(i,r)) { |
| strcpy(portstr,""); |
| } else { |
| apr_snprintf(portstr, sizeof portstr, ":%d", i); |
| } |
| /* Generate outgoing Via: header with/without server comment: */ |
| ap_table_mergen(r->headers_in, "Via", |
| (conf->viaopt == via_full) |
| ? apr_psprintf(p, "%d.%d %s%s (%s)", |
| HTTP_VERSION_MAJOR(r->proto_num), |
| HTTP_VERSION_MINOR(r->proto_num), |
| ap_get_server_name(r), portstr, |
| AP_SERVER_BASEVERSION) |
| : apr_psprintf(p, "%d.%d %s%s", |
| HTTP_VERSION_MAJOR(r->proto_num), |
| HTTP_VERSION_MINOR(r->proto_num), |
| ap_get_server_name(r), portstr) |
| ); |
| } |
| |
| reqhdrs_arr = apr_table_elts(r->headers_in); |
| reqhdrs = (apr_table_entry_t *) reqhdrs_arr->elts; |
| for (i = 0; i < reqhdrs_arr->nelts; i++) { |
| if (reqhdrs[i].key == NULL || reqhdrs[i].val == NULL |
| /* Clear out headers not to send */ |
| || !strcasecmp(reqhdrs[i].key, "Host") /* Already sent */ |
| /* XXX: @@@ FIXME: "Proxy-Authorization" should *only* be |
| * suppressed if THIS server requested the authentication, |
| * not when a frontend proxy requested it! |
| */ |
| || !strcasecmp(reqhdrs[i].key, "Proxy-Authorization")) |
| continue; |
| buf = apr_pstrcat(r->pool, reqhdrs[i].key, ": ", reqhdrs[i].val, CRLF, NULL); |
| e = apr_bucket_pool_create(buf, strlen(buf), r->pool); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| |
| } |
| |
| e = apr_bucket_pool_create(CRLF, strlen(CRLF), r->pool); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| e = apr_bucket_flush_create(); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| |
| ap_pass_brigade(origin->output_filters, bb); |
| /* send the request data, if any. */ |
| |
| if (ap_should_client_block(r)) { |
| while ((i = ap_get_client_block(r, buffer, sizeof buffer)) > 0) { |
| e = apr_bucket_pool_create(buffer, i, r->pool); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| } |
| } |
| /* Flush the data to the origin server */ |
| e = apr_bucket_flush_create(); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| ap_pass_brigade(origin->output_filters, bb); |
| |
| ap_add_input_filter("HTTP_IN", NULL, NULL, origin); |
| ap_add_input_filter("CORE_IN", NULL, NULL, origin); |
| |
| apr_brigade_destroy(bb); |
| bb = apr_brigade_create(r->pool); |
| |
| /* Tell http_filter to grab the data one line at a time. */ |
| origin->remain = 0; |
| |
| ap_get_brigade(origin->input_filters, bb, AP_MODE_BLOCKING); |
| e = APR_BRIGADE_FIRST(bb); |
| apr_bucket_read(e, (const char **)&buffer2, &len, APR_BLOCK_READ); |
| if (len == -1) { |
| apr_socket_close(sock); |
| ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, |
| "ap_get_brigade() - proxy receive - Error reading from remote server %s (length %d)", |
| proxyhost ? proxyhost : desthost, len); |
| return ap_proxyerror(r, HTTP_BAD_GATEWAY, |
| "Error reading from remote server"); |
| } else if (len == 0) { |
| apr_socket_close(sock); |
| return ap_proxyerror(r, HTTP_BAD_GATEWAY, |
| "Document contains no data"); |
| } |
| APR_BUCKET_REMOVE(e); |
| apr_bucket_destroy(e); |
| |
| /* Is it an HTTP/1 response? This is buggy if we ever see an HTTP/1.10 */ |
| if (ap_checkmask(buffer2, "HTTP/#.# ###*")) { |
| int major, minor; |
| if (2 != sscanf(buffer2, "HTTP/%u.%u", &major, &minor)) { |
| major = 1; |
| minor = 0; |
| } |
| |
| /* If not an HTTP/1 message or if the status line was > 8192 bytes */ |
| if (buffer2[5] != '1' || buffer2[len - 1] != '\n') { |
| apr_socket_close(sock); |
| return HTTP_BAD_GATEWAY; |
| } |
| backasswards = 0; |
| buffer2[--len] = '\0'; |
| |
| buffer2[12] = '\0'; |
| r->status = atoi(&buffer2[9]); |
| |
| buffer2[12] = ' '; |
| r->status_line = apr_pstrdup(p, &buffer2[9]); |
| |
| /* read the headers. */ |
| /* N.B. for HTTP/1.0 clients, we have to fold line-wrapped headers */ |
| /* Also, take care with headers with multiple occurences. */ |
| |
| resp_hdrs = ap_proxy_read_headers(r, buffer, HUGE_STRING_LEN, origin); |
| if (resp_hdrs == NULL) { |
| ap_log_error(APLOG_MARK, APLOG_WARNING|APLOG_NOERRNO, 0, r->server, |
| "proxy: Bad HTTP/%d.%d header returned by %s (%s)", |
| major, minor, r->uri, r->method); |
| nocache = 1; /* do not cache this broken file */ |
| } |
| else |
| { |
| clear_connection(p, resp_hdrs); /* Strip Connection hdrs */ |
| if (apr_table_get(resp_hdrs, "Content-type")) { |
| r->content_type = apr_pstrdup(r->pool, apr_table_get(resp_hdrs, "Content-type")); |
| } |
| } |
| |
| if (conf->viaopt != via_off && conf->viaopt != via_block) { |
| /* Create a "Via:" response header entry and merge it */ |
| i = ap_get_server_port(r); |
| if (ap_is_default_port(i,r)) { |
| strcpy(portstr,""); |
| } else { |
| apr_snprintf(portstr, sizeof portstr, ":%d", i); |
| } |
| } |
| } |
| else { |
| /* an http/0.9 response */ |
| backasswards = 1; |
| r->status = 200; |
| r->status_line = "200 OK"; |
| } |
| |
| /* |
| * HTTP/1.0 requires us to accept 3 types of dates, but only generate |
| * one type |
| */ |
| |
| #if 0 |
| if (ap_cache_el_header(c, "Date", &datestr) == APR_SUCCESS) |
| ap_cache_el_header_set(c, "Date", ap_proxy_date_canon(p, datestr)); |
| if (ap_cache_el_header(c, "Last-Modified", &datestr) == APR_SUCCESS) |
| ap_cache_el_header_set(c, "Last-Modified", ap_proxy_date_canon(p, datestr)); |
| if (ap_cache_el_header(c, "Expires", &datestr) == APR_SUCCESS) |
| ap_cache_el_header_set(c, "Expires", ap_proxy_date_canon(p, datestr)); |
| |
| if (ap_cache_el_header(c, "Location", &datestr) == APR_SUCCESS) |
| ap_cache_el_header_set(c, "Location", proxy_location_reverse_map(r, datestr)); |
| if (ap_cache_el_header(c, "URI", &datestr) == APR_SUCCESS) |
| ap_cache_el_header_set(c, "URI", proxy_location_reverse_map(r, datestr)); |
| #endif |
| |
| /* write status line */ |
| #if 0 |
| if (!r->assbackwards) |
| ap_rvputs(r, "HTTP/1.0 ", r->status_line, CRLF, NULL); |
| |
| if (cachefp && apr_file_puts(apr_pstrcat(r->pool, "HTTP/1.0 ", |
| r->status_line, CRLF, NULL), cachefp) != APR_SUCCESS) { |
| ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, |
| "proxy: error writing status line to cache"); |
| ap_proxy_cache_error(&c); |
| cachefp = NULL; |
| } |
| #endif |
| |
| #if 0 |
| /* send headers */ |
| ap_cache_el_header_walk(c, ap_proxy_send_hdr_line, r, NULL); |
| #endif |
| /* |
| if (!r->assbackwards) |
| ap_rputs(CRLF, r); |
| */ |
| r->sent_bodyct = 1; |
| /* Is it an HTTP/0.9 response? If so, send the extra data */ |
| if (backasswards) { |
| cntr = len; |
| e = apr_bucket_heap_create(buffer, cntr, 0, NULL); |
| APR_BRIGADE_INSERT_TAIL(bb, e); |
| if (cachefp && apr_file_write(cachefp, buffer, &cntr) != APR_SUCCESS) { |
| ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, |
| "proxy: error writing extra data to cache"); |
| } |
| } |
| |
| /* send body */ |
| /* if header only, then cache will be NULL */ |
| /* HTTP/1.0 tells us to read to EOF, rather than content-length bytes */ |
| if (!r->header_only) { |
| proxy_completion pc; |
| pc.content_length = content_length; |
| pc.cache_completion = conf->cache_completion; |
| |
| origin->remain = content_length; |
| while (ap_get_brigade(origin->input_filters, bb, AP_MODE_BLOCKING) == APR_SUCCESS) { |
| if (APR_BUCKET_IS_EOS(APR_BRIGADE_LAST(bb))) { |
| ap_pass_brigade(r->output_filters, bb); |
| break; |
| } |
| ap_pass_brigade(r->output_filters, bb); |
| apr_brigade_destroy(bb); |
| bb = apr_brigade_create(r->pool); |
| } |
| } |
| |
| apr_socket_close(sock); |
| return OK; |
| } |