1 /* ====================================================================
2 * The Apache Software License, Version 1.1
4 * Copyright (c) 2000-2001 The Apache Software Foundation. All rights
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in
16 * the documentation and/or other materials provided with the
19 * 3. The end-user documentation included with the redistribution,
20 * if any, must include the following acknowledgment:
21 * "This product includes software developed by the
22 * Apache Software Foundation (http://www.apache.org/)."
23 * Alternately, this acknowledgment may appear in the software itself,
24 * if and wherever such third-party acknowledgments normally appear.
26 * 4. The names "Apache" and "Apache Software Foundation" must
27 * not be used to endorse or promote products derived from this
28 * software without prior written permission. For written
29 * permission, please contact apache@apache.org.
31 * 5. Products derived from this software may not be called "Apache",
32 * nor may "Apache" appear in their name, without prior written
33 * permission of the Apache Software Foundation.
35 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
36 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
37 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
38 * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
39 * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
40 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
41 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
42 * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
43 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
44 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
45 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
47 * ====================================================================
49 * This software consists of voluntary contributions made by many
50 * individuals on behalf of the Apache Software Foundation. For more
51 * information on the Apache Software Foundation, please see
52 * <http://www.apache.org/>.
54 * Portions of this software are based upon public domain software
55 * originally written at the National Center for Supercomputing Applications,
56 * University of Illinois, Urbana-Champaign.
61 #include "apr_strings.h"
63 #define APR_WANT_STRFUNC
71 #include "ap_config.h"
73 #include "http_config.h"
74 #include "http_main.h"
76 #include "http_core.h"
77 #include "http_protocol.h"
78 #include "http_request.h" /* for sub_req_lookup_uri() */
79 #include "util_script.h"
80 #include "apr_date.h" /* For apr_date_parse_http() */
81 #include "util_ebcdic.h"
89 * Various utility functions which are common to a whole lot of
90 * script-type extensions mechanisms, and might as well be gathered
91 * in one place (if only to avoid creating inter-module dependencies
92 * where there don't have to be any).
95 #define MALFORMED_MESSAGE "malformed header from script. Bad header="
96 #define MALFORMED_HEADER_LENGTH_TO_SHOW 30
98 static char *http2env(apr_pool_t *a, const char *w)
100 char *res = (char *)apr_palloc(a, sizeof("HTTP_") + strlen(w));
110 while ((c = *w++) != 0) {
111 if (!apr_isalnum(c)) {
115 *cp++ = apr_toupper(c);
123 AP_DECLARE(char **) ap_create_environment(apr_pool_t *p, apr_table_t *t)
125 const apr_array_header_t *env_arr = apr_table_elts(t);
126 const apr_table_entry_t *elts = (const apr_table_entry_t *) env_arr->elts;
127 char **env = (char **) apr_palloc(p, (env_arr->nelts + 2) * sizeof(char *));
133 if (!apr_table_get(t, "TZ")) {
136 env[j++] = apr_pstrcat(p, "TZ=", tz, NULL);
139 for (i = 0; i < env_arr->nelts; ++i) {
143 env[j] = apr_pstrcat(p, elts[i].key, "=", elts[i].val, NULL);
145 if (apr_isdigit(*whack)) {
148 while (*whack != '=') {
149 if (!apr_isalnum(*whack) && *whack != '_') {
161 AP_DECLARE(void) ap_add_common_vars(request_rec *r)
164 server_rec *s = r->server;
165 conn_rec *c = r->connection;
166 const char *rem_logname;
168 #if defined(WIN32) || defined(OS2) || defined(BEOS)
172 const apr_array_header_t *hdrs_arr = apr_table_elts(r->headers_in);
173 const apr_table_entry_t *hdrs = (const apr_table_entry_t *) hdrs_arr->elts;
177 /* use a temporary apr_table_t which we'll overlap onto
178 * r->subprocess_env later
180 e = apr_table_make(r->pool, 25 + hdrs_arr->nelts);
182 /* First, add environment vars from headers... this is as per
183 * CGI specs, though other sorts of scripting interfaces see
187 for (i = 0; i < hdrs_arr->nelts; ++i) {
192 /* A few headers are special cased --- Authorization to prevent
193 * rogue scripts from capturing passwords; content-type and -length
194 * for no particular reason.
197 if (!strcasecmp(hdrs[i].key, "Content-type")) {
198 apr_table_addn(e, "CONTENT_TYPE", hdrs[i].val);
200 else if (!strcasecmp(hdrs[i].key, "Content-length")) {
201 apr_table_addn(e, "CONTENT_LENGTH", hdrs[i].val);
204 * You really don't want to disable this check, since it leaves you
205 * wide open to CGIs stealing passwords and people viewing them
206 * in the environment with "ps -e". But, if you must...
208 #ifndef SECURITY_HOLE_PASS_AUTHORIZATION
209 else if (!strcasecmp(hdrs[i].key, "Authorization")
210 || !strcasecmp(hdrs[i].key, "Proxy-Authorization")) {
215 apr_table_addn(e, http2env(r->pool, hdrs[i].key), hdrs[i].val);
219 if (!(env_path = getenv("PATH"))) {
220 env_path = DEFAULT_PATH;
222 apr_table_addn(e, "PATH", apr_pstrdup(r->pool, env_path));
225 if (env_temp = getenv("SystemRoot")) {
226 apr_table_addn(e, "SystemRoot", env_temp);
228 if (env_temp = getenv("COMSPEC")) {
229 apr_table_addn(e, "COMSPEC", env_temp);
231 if (env_temp = getenv("PATHEXT")) {
232 apr_table_addn(e, "PATHEXT", env_temp);
234 if (env_temp = getenv("WINDIR")) {
235 apr_table_addn(e, "WINDIR", env_temp);
240 if ((env_temp = getenv("COMSPEC")) != NULL) {
241 apr_table_addn(e, "COMSPEC", env_temp);
243 if ((env_temp = getenv("ETC")) != NULL) {
244 apr_table_addn(e, "ETC", env_temp);
246 if ((env_temp = getenv("DPATH")) != NULL) {
247 apr_table_addn(e, "DPATH", env_temp);
249 if ((env_temp = getenv("PERLLIB_PREFIX")) != NULL) {
250 apr_table_addn(e, "PERLLIB_PREFIX", env_temp);
255 if ((env_temp = getenv("LIBRARY_PATH")) != NULL) {
256 apr_table_addn(e, "LIBRARY_PATH", env_temp);
260 apr_table_addn(e, "SERVER_SIGNATURE", ap_psignature("", r));
261 apr_table_addn(e, "SERVER_SOFTWARE", ap_get_server_version());
262 apr_table_addn(e, "SERVER_NAME", ap_get_server_name(r));
263 apr_table_addn(e, "SERVER_ADDR", r->connection->local_ip); /* Apache */
264 apr_table_addn(e, "SERVER_PORT",
265 apr_psprintf(r->pool, "%u", ap_get_server_port(r)));
266 host = ap_get_remote_host(c, r->per_dir_config, REMOTE_HOST, NULL);
268 apr_table_addn(e, "REMOTE_HOST", host);
270 apr_table_addn(e, "REMOTE_ADDR", c->remote_ip);
271 apr_table_addn(e, "DOCUMENT_ROOT", ap_document_root(r)); /* Apache */
272 apr_table_addn(e, "SERVER_ADMIN", s->server_admin); /* Apache */
273 apr_table_addn(e, "SCRIPT_FILENAME", r->filename); /* Apache */
275 apr_sockaddr_port_get(&rport, c->remote_addr);
276 apr_table_addn(e, "REMOTE_PORT", apr_itoa(r->pool, rport));
279 apr_table_addn(e, "REMOTE_USER", r->user);
281 if (r->ap_auth_type) {
282 apr_table_addn(e, "AUTH_TYPE", r->ap_auth_type);
284 rem_logname = ap_get_remote_logname(r);
286 apr_table_addn(e, "REMOTE_IDENT", apr_pstrdup(r->pool, rem_logname));
289 /* Apache custom error responses. If we have redirected, set two new vars */
293 apr_table_addn(e, "REDIRECT_QUERY_STRING", r->prev->args);
296 apr_table_addn(e, "REDIRECT_URL", r->prev->uri);
300 apr_table_overlap(r->subprocess_env, e, APR_OVERLAP_TABLES_SET);
303 /* This "cute" little function comes about because the path info on
304 * filenames and URLs isn't always the same. So we take the two,
305 * and match up as much of the two as possible.
308 AP_DECLARE(int) ap_find_path_info(const char *uri, const char *path_info)
310 int lu = strlen(uri);
311 int lp = strlen(path_info);
313 while (lu-- && lp-- && uri[lu] == path_info[lp]);
319 while (uri[lu] != '\0' && uri[lu] != '/') {
325 /* Obtain the Request-URI from the original request-line, returning
326 * a new string from the request pool containing the URI or "".
328 static char *original_uri(request_rec *r)
332 if (r->the_request == NULL) {
333 return (char *) apr_pcalloc(r->pool, 1);
336 first = r->the_request; /* use the request-line */
338 while (*first && !apr_isspace(*first)) {
339 ++first; /* skip over the method */
341 while (apr_isspace(*first)) {
342 ++first; /* and the space(s) */
346 while (*last && !apr_isspace(*last)) {
347 ++last; /* end at next whitespace */
350 return apr_pstrndup(r->pool, first, last - first);
353 AP_DECLARE(void) ap_add_cgi_vars(request_rec *r)
355 apr_table_t *e = r->subprocess_env;
357 apr_table_setn(e, "GATEWAY_INTERFACE", "CGI/1.1");
358 apr_table_setn(e, "SERVER_PROTOCOL", r->protocol);
359 apr_table_setn(e, "REQUEST_METHOD", r->method);
360 apr_table_setn(e, "QUERY_STRING", r->args ? r->args : "");
361 apr_table_setn(e, "REQUEST_URI", original_uri(r));
363 /* Note that the code below special-cases scripts run from includes,
364 * because it "knows" that the sub_request has been hacked to have the
365 * args and path_info of the original request, and not any that may have
366 * come with the script URI in the include command. Ugh.
369 if (!strcmp(r->protocol, "INCLUDED")) {
370 apr_table_setn(e, "SCRIPT_NAME", r->uri);
371 if (r->path_info && *r->path_info) {
372 apr_table_setn(e, "PATH_INFO", r->path_info);
375 else if (!r->path_info || !*r->path_info) {
376 apr_table_setn(e, "SCRIPT_NAME", r->uri);
379 int path_info_start = ap_find_path_info(r->uri, r->path_info);
381 apr_table_setn(e, "SCRIPT_NAME",
382 apr_pstrndup(r->pool, r->uri, path_info_start));
384 apr_table_setn(e, "PATH_INFO", r->path_info);
387 if (r->path_info && r->path_info[0]) {
389 * To get PATH_TRANSLATED, treat PATH_INFO as a URI path.
390 * Need to re-escape it for this, since the entire URI was
391 * un-escaped before we determined where the PATH_INFO began.
395 pa_req = ap_sub_req_lookup_uri(ap_escape_uri(r->pool, r->path_info), r,
398 if (pa_req->filename) {
399 char *pt = apr_pstrcat(r->pool, pa_req->filename, pa_req->path_info,
402 /* We need to make this a real Windows path name */
403 apr_filepath_merge(&pt, "", pt, APR_FILEPATH_NATIVE, r->pool);
405 apr_table_setn(e, "PATH_TRANSLATED", pt);
407 ap_destroy_sub_req(pa_req);
412 static int set_cookie_doo_doo(void *v, const char *key, const char *val)
414 apr_table_addn(v, key, val);
418 AP_DECLARE(int) ap_scan_script_header_err_core(request_rec *r, char *buffer,
419 int (*getsfunc) (char *, int, void *),
422 char x[MAX_STRING_LEN];
425 int cgi_status = HTTP_OK;
427 apr_table_t *cookie_table;
432 w = buffer ? buffer : x;
434 /* temporary place to hold headers to merge in later */
435 merge = apr_table_make(r->pool, 10);
437 /* The HTTP specification says that it is legal to merge duplicate
438 * headers into one. Some browsers that support Cookies don't like
439 * merged headers and prefer that each Set-Cookie header is sent
440 * separately. Let's humour those browsers by not merging.
441 * Oh what a pain it is.
443 cookie_table = apr_table_make(r->pool, 2);
444 apr_table_do(set_cookie_doo_doo, cookie_table, r->err_headers_out, "Set-Cookie", NULL);
448 if ((*getsfunc) (w, MAX_STRING_LEN - 1, getsfunc_data) == 0) {
449 ap_log_rerror(APLOG_MARK, APLOG_NOERRNO|APLOG_ERR, 0, r,
450 "Premature end of script headers: %s", r->filename);
451 return HTTP_INTERNAL_SERVER_ERROR;
454 /* Delete terminal (CR?)LF */
457 /* Indeed, the host's '\n':
458 '\012' for UNIX; '\015' for MacOS; '\025' for OS/390
459 -- whatever the script generates.
461 if (p > 0 && w[p - 1] == '\n') {
462 if (p > 1 && w[p - 2] == CR) {
471 * If we've finished reading the headers, check to make sure any
472 * HTTP/1.1 conditions are met. If so, we're done; normal processing
473 * will handle the script's output. If not, just return the error.
474 * The appropriate thing to do would be to send the script process a
475 * SIGPIPE to let it know we're ignoring it, close the channel to the
476 * script process, and *then* return the failed-to-meet-condition
477 * error. Otherwise we'd be waiting for the script to finish
478 * blithering before telling the client the output was no good.
479 * However, we don't have the information to do that, so we have to
480 * leave it to an upper layer.
483 int cond_status = OK;
485 if ((cgi_status == HTTP_OK) && (r->method_number == M_GET)) {
486 cond_status = ap_meets_conditions(r);
488 apr_table_overlap(r->err_headers_out, merge,
489 APR_OVERLAP_TABLES_MERGE);
490 if (!apr_is_empty_table(cookie_table)) {
491 /* the cookies have already been copied to the cookie_table */
492 apr_table_unset(r->err_headers_out, "Set-Cookie");
493 r->err_headers_out = apr_table_overlay(r->pool,
494 r->err_headers_out, cookie_table);
499 /* if we see a bogus header don't ignore it. Shout and scream */
501 #if APR_CHARSET_EBCDIC
502 /* Chances are that we received an ASCII header text instead of
503 * the expected EBCDIC header lines. Try to auto-detect:
505 if (!(l = strchr(w, ':'))) {
506 int maybeASCII = 0, maybeEBCDIC = 0;
507 unsigned char *cp, native;
508 apr_size_t inbytes_left, outbytes_left;
510 for (cp = w; *cp != '\0'; ++cp) {
511 native = apr_xlate_conv_byte(ap_hdrs_from_ascii, *cp);
512 if (isprint(*cp) && !isprint(native))
514 if (!isprint(*cp) && isprint(native))
517 if (maybeASCII > maybeEBCDIC) {
518 ap_log_error(APLOG_MARK, APLOG_NOERRNO|APLOG_ERR, 0, r->server,
519 "CGI Interface Error: Script headers apparently ASCII: (CGI = %s)",
521 inbytes_left = outbytes_left = cp - w;
522 apr_xlate_conv_buffer(ap_hdrs_from_ascii,
523 w, &inbytes_left, w, &outbytes_left);
526 #endif /*APR_CHARSET_EBCDIC*/
527 if (!(l = strchr(w, ':'))) {
528 char malformed[(sizeof MALFORMED_MESSAGE) + 1
529 + MALFORMED_HEADER_LENGTH_TO_SHOW];
531 strcpy(malformed, MALFORMED_MESSAGE);
532 strncat(malformed, w, MALFORMED_HEADER_LENGTH_TO_SHOW);
535 /* Soak up all the script output - may save an outright kill */
536 while ((*getsfunc) (w, MAX_STRING_LEN - 1, getsfunc_data)) {
541 ap_log_rerror(APLOG_MARK, APLOG_NOERRNO|APLOG_ERR, 0, r,
542 "%s: %s", malformed, r->filename);
543 return HTTP_INTERNAL_SERVER_ERROR;
547 while (*l && apr_isspace(*l)) {
551 if (!strcasecmp(w, "Content-type")) {
554 /* Nuke trailing whitespace */
556 char *endp = l + strlen(l) - 1;
557 while (endp > l && apr_isspace(*endp)) {
561 tmp = apr_pstrdup(r->pool, l);
562 ap_content_type_tolower(tmp);
563 r->content_type = tmp;
566 * If the script returned a specific status, that's what
567 * we'll use - otherwise we assume 200 OK.
569 else if (!strcasecmp(w, "Status")) {
570 r->status = cgi_status = atoi(l);
571 r->status_line = apr_pstrdup(r->pool, l);
573 else if (!strcasecmp(w, "Location")) {
574 apr_table_set(r->headers_out, w, l);
576 else if (!strcasecmp(w, "Content-Length")) {
577 apr_table_set(r->headers_out, w, l);
579 else if (!strcasecmp(w, "Transfer-Encoding")) {
580 apr_table_set(r->headers_out, w, l);
583 * If the script gave us a Last-Modified header, we can't just
584 * pass it on blindly because of restrictions on future values.
586 else if (!strcasecmp(w, "Last-Modified")) {
587 ap_update_mtime(r, apr_date_parse_http(l));
588 ap_set_last_modified(r);
590 else if (!strcasecmp(w, "Set-Cookie")) {
591 apr_table_add(cookie_table, w, l);
594 apr_table_add(merge, w, l);
601 static int getsfunc_FILE(char *buf, int len, void *f)
603 return apr_file_gets(buf, len, (apr_file_t *) f) == APR_SUCCESS;
606 AP_DECLARE(int) ap_scan_script_header_err(request_rec *r, apr_file_t *f,
609 return ap_scan_script_header_err_core(r, buffer, getsfunc_FILE, f);
618 static int getsfunc_STRING(char *w, int len, void *pvastrs)
620 struct vastrs *strs = (struct vastrs*) pvastrs;
624 if (!strs->curpos || !*strs->curpos)
626 p = ap_strchr_c(strs->curpos, '\n');
630 p = ap_strchr_c(strs->curpos, '\0');
631 t = p - strs->curpos;
634 strncpy (w, strs->curpos, t);
636 if (!strs->curpos[t]) {
638 strs->curpos = va_arg(strs->args, const char *);
645 /* ap_scan_script_header_err_strs() accepts additional const char* args...
646 * each is treated as one or more header lines, and the first non-header
647 * character is returned to **arg, **data. (The first optional arg is
650 AP_DECLARE_NONSTD(int) ap_scan_script_header_err_strs(request_rec *r,
658 va_start(strs.args, termarg);
660 strs.curpos = va_arg(strs.args, char*);
661 res = ap_scan_script_header_err_core(r, buffer, getsfunc_STRING, (void *) &strs);
663 *termch = strs.curpos;