/[hydra]/hydra/src/cgi.c
ViewVC logotype

Contents of /hydra/src/cgi.c

Parent Directory Parent Directory | Revision Log Revision Log


Revision 1.11 - (show annotations)
Fri Sep 27 21:24:37 2002 UTC (21 years, 6 months ago) by nmav
Branch: MAIN
Changes since 1.10: +3 -1 lines
File MIME type: text/plain
more HIC stuff

1 /*
2 * Boa, an http server
3 * Copyright (C) 1995 Paul Phillips <paulp@go2net.com>
4 * Some changes Copyright (C) 1996,97 Larry Doolittle <ldoolitt@boa.org>
5 * Some changes Copyright (C) 1996 Charles F. Randall <crandall@goldsys.com>
6 * Some changes Copyright (C) 1997-2002 Jon Nelson <jnelson@boa.org>
7 *
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; either version 1, or (at your option)
11 * any later version.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to the Free Software
20 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
21 *
22 */
23
24 /* $Id: cgi.c,v 1.10 2002/09/27 21:09:11 nmav Exp $ */
25
26 #include "boa.h"
27
/* Forward declaration: env_gen_extra is defined further down but is
 * already needed by create_common_env. */
static char *env_gen_extra(const char *key, const char *value, int extra);

/* When non-zero, init_cgi logs the pathname and pid of each forked child. */
int verbose_cgi_logs = 0;
/* Environment strings shared by every CGI request.  The +1 is for the
 * NULL terminator that complete_env relies on when copying this array. */
static char *common_cgi_env[COMMON_CGI_COUNT + 1];
33
34 /*
35 * Name: create_common_env
36 *
37 * Description: Set up the environment variables that are common to
38 * all CGI scripts
39 */
40
41 void create_common_env()
42 {
43 int index = 0, i;
44
45
46 /* NOTE NOTE NOTE:
47 If you (the reader) someday modify this chunk of code to
48 handle more "common" CGI environment variables, then bump the
49 value COMMON_CGI_COUNT in defines.h UP
50
51 Also, in the case of document_root and server_admin, two variables
52 that may or may not be defined depending on the way the server
53 is configured, we check for null values and use an empty
54 string to denote a NULL value to the environment, as per the
55 specification. The quote for which follows:
56
57 "In all cases, a missing environment variable is
58 equivalent to a zero-length (NULL) value, and vice versa."
59 */
60 common_cgi_env[index++] = env_gen_extra("PATH",
61 ((cgi_path !=
62 NULL) ? cgi_path :
63 DEFAULT_PATH), 0);
64 common_cgi_env[index++] =
65 env_gen_extra("SERVER_SOFTWARE", SERVER_NAME "/" SERVER_VERSION, 0);
66 common_cgi_env[index++] =
67 env_gen_extra("GATEWAY_INTERFACE", CGI_VERSION, 0);
68
69 /* removed the SERVER_PORT which may change due to SSL support
70 * Also removed the DOCUMENT_ROOT, SERVER_NAME, which are now per request.
71 */
72
73
74 /* NCSA added */
75 /* common_cgi_env[index++] = env_gen_extra("SERVER_ROOT", server_root); */
76
77 /* APACHE added */
78 common_cgi_env[index++] =
79 env_gen_extra("SERVER_ADMIN", server_admin, 0);
80 common_cgi_env[index] = NULL;
81
82 /* Sanity checking -- make *sure* the memory got allocated */
83 if (index > COMMON_CGI_COUNT) {
84 log_error_time();
85 fprintf(stderr, "COMMON_CGI_COUNT not high enough.\n");
86 exit(1);
87 }
88
89 for (i = 0; i < index; ++i) {
90 if (common_cgi_env[i] == NULL) {
91 log_error_time();
92 fprintf(stderr,
93 "Unable to allocate a component of common_cgi_env - out of memory.\n");
94 exit(1);
95 }
96 }
97 }
98
99 void clear_common_env(void)
100 {
101 int i;
102
103 for (i = 0; i <= COMMON_CGI_COUNT; ++i) {
104 if (common_cgi_env[i] != NULL) {
105 free(common_cgi_env[i]);
106 common_cgi_env[i] = NULL;
107 }
108 }
109 }
110
/*
 * Name: env_gen_extra
 *       (and via a not-so-tricky #define, env_gen)
 *
 * Description: Allocates a buffer holding `extra` leading bytes followed
 * by "key=value" and a terminating NUL.  The `extra` leading bytes are
 * left unwritten for the caller to fill in.  A NULL value is treated as
 * the empty string.
 *
 * Returns the malloc'ed buffer (the caller must free it), or NULL after
 * logging when the allocation fails.
 */
static char *env_gen_extra(const char *key, const char *value, int extra)
{
    int klen, vlen;
    char *buf;
    char *dst;

    /* ServerAdmin may not be defined, eg */
    if (value == NULL) {
        value = "";
    }
    klen = strlen(key);
    vlen = strlen(value);

    /* the +2 leaves room for the '=' sign and the null terminator */
    buf = malloc(extra + klen + vlen + 2);
    if (buf == NULL) {
        log_error_time();
        perror("malloc");
        log_error_time();
        fprintf(stderr,
                "tried to allocate (key=value) extra=%d: %s=%s\n",
                extra, key, value);
        return buf;
    }

    dst = buf + extra;
    memcpy(dst, key, klen);
    dst += klen;
    *dst++ = '=';
    memcpy(dst, value, vlen);
    dst[vlen] = '\0';

    return buf;
}
142
143 /*
144 * Name: add_cgi_env
145 *
146 * Description: adds a variable to CGI's environment
147 * Used for HTTP_ headers
148 */
149
150 int add_cgi_env(request * req, const char *key, const char *value,
151 int http_prefix)
152 {
153 char *p;
154 int prefix_len;
155
156 if (http_prefix) {
157 prefix_len = 5;
158 } else {
159 prefix_len = 0;
160 }
161
162 if (req->cgi_env_index < CGI_ENV_MAX) {
163 p = env_gen_extra(key, value, prefix_len);
164 if (!p) {
165 log_error_time();
166 fprintf(stderr, "Unable to generate additional CGI Environment"
167 "variable -- ran out of memory!\n");
168 }
169 if (prefix_len)
170 memcpy(p, "HTTP_", 5);
171 req->cgi_env[req->cgi_env_index++] = p;
172 return 1;
173 } else {
174 log_error_time();
175 fprintf(stderr, "Unable to generate additional CGI Environment"
176 "variable -- not enough space!\n");
177 }
178 return 0;
179 }
180
/*
 * Adds an un-prefixed variable through add_cgi_env and makes the
 * *calling function* return 0 if that fails, so it may only be used
 * inside functions returning int.  Wrapped in do { } while (0) so that
 * the macro behaves as a single statement, including in an unbraced
 * if/else.
 */
#define my_add_cgi_env(req, key, value) do { \
        int ok = add_cgi_env(req, key, value, 0); \
        if (!ok) return 0; \
    } while (0)
185
186 const char *hydra_method_str(int method)
187 {
188 char *w;
189 switch (method) {
190 case M_POST:
191 w = "POST";
192 break;
193 case M_HEAD:
194 w = "HEAD";
195 break;
196 case M_GET:
197 w = "GET";
198 break;
199 default:
200 w = "UNKNOWN";
201 break;
202 }
203 return w;
204 }
205
206 /*
207 * Name: complete_env
208 *
209 * Description: adds the known client header env variables
210 * and terminates the environment array
211 */
212
213 int complete_env(request * req)
214 {
215 int i;
216 char buf[22];
217 const char *w;
218
219 for (i = 0; common_cgi_env[i]; i++)
220 req->cgi_env[i] = common_cgi_env[i];
221
222 w = hydra_method_str(req->method);
223 my_add_cgi_env(req, "REQUEST_METHOD", w);
224
225 if (req->secure) {
226 simple_itoa(ssl_port, buf);
227 } else {
228 simple_itoa(server_port, buf);
229 }
230 my_add_cgi_env(req, "SERVER_PORT", buf);
231 my_add_cgi_env(req, "SERVER_NAME", req->hostname);
232
233 /* NCSA and APACHE added -- not in CGI spec */
234 /* my_add_cgi_env( req, "DOCUMENT_ROOT", req->document_root); */
235
236 my_add_cgi_env(req, "SERVER_ADDR", req->local_ip_addr);
237 my_add_cgi_env(req, "SERVER_PROTOCOL", req->http_version);
238 my_add_cgi_env(req, "REQUEST_URI", req->request_uri);
239
240 if (req->path_info)
241 my_add_cgi_env(req, "PATH_INFO", req->path_info);
242
243 if (req->path_translated)
244 /* while path_translated depends on path_info,
245 * there are cases when path_translated might
246 * not exist when path_info does
247 */
248 my_add_cgi_env(req, "PATH_TRANSLATED", req->path_translated);
249
250 my_add_cgi_env(req, "SCRIPT_NAME", req->script_name);
251
252 if (req->query_string)
253 my_add_cgi_env(req, "QUERY_STRING", req->query_string);
254 my_add_cgi_env(req, "REMOTE_ADDR", req->remote_ip_addr);
255
256 simple_itoa(req->remote_port, buf);
257 my_add_cgi_env(req, "REMOTE_PORT", buf);
258
259 if (req->method == M_POST) {
260 if (req->content_type) {
261 my_add_cgi_env(req, "CONTENT_TYPE", req->content_type);
262 } else {
263 my_add_cgi_env(req, "CONTENT_TYPE", default_type);
264 }
265 if (req->content_length) {
266 my_add_cgi_env(req, "CONTENT_LENGTH", req->content_length);
267 }
268 }
269 #ifdef ACCEPT_ON
270 if (req->accept[0])
271 my_add_cgi_env(req, "HTTP_ACCEPT", req->accept);
272 #endif
273
274 if (req->cgi_env_index < CGI_ENV_MAX + 1) {
275 req->cgi_env[req->cgi_env_index] = NULL; /* terminate */
276 return 1;
277 }
278 log_error_time();
279 fprintf(stderr, "Not enough space in CGI environment for remainder"
280 " of variables.\n");
281 return 0;
282 }
283
284 /*
285 * Name: make_args_cgi
286 *
287 * Build argv list for a CGI script according to spec
288 *
289 */
290
291 void create_argv(request * req, char **aargv)
292 {
293 char *p, *q, *r;
294 int aargc;
295
296 q = req->query_string;
297 aargv[0] = req->pathname;
298
299 /* here, we handle a special "indexed" query string.
300 * Taken from the CGI/1.1 SPEC:
301 * This is identified by a GET or HEAD request with a query string
302 * with no *unencoded* '=' in it.
303 * For such a request, I'm supposed to parse the search string
304 * into words, according to the following rules:
305
306 search-string = search-word *( "+" search-word )
307 search-word = 1*schar
308 schar = xunreserved | escaped | xreserved
309 xunreserved = alpha | digit | xsafe | extra
310 xsafe = "$" | "-" | "_" | "."
311 xreserved = ";" | "/" | "?" | ":" | "@" | "&"
312
313 After parsing, each word is URL-decoded, optionally encoded in a system
314 defined manner, and then the argument list
315 is set to the list of words.
316
317
318 Thus, schar is alpha|digit|"$"|"-"|"_"|"."|";"|"/"|"?"|":"|"@"|"&"
319
320 As of this writing, escape.pl escapes the following chars:
321
322 "-", "_", ".", "!", "~", "*", "'", "(", ")",
323 "0".."9", "A".."Z", "a".."z",
324 ";", "/", "?", ":", "@", "&", "=", "+", "\$", ","
325
326 Which therefore means
327 "=", "+", "~", "!", "*", "'", "(", ")", ","
328 are *not* escaped and should be?
329 Wait, we don't do any escaping, and nor should we.
330 According to the RFC draft, we unescape and then re-escape
331 in a "system defined manner" (here: none).
332
333 The CGI/1.1 draft (03, latest is 1999???) is very unclear here.
334
335 I am using the latest published RFC, 2396, for what does and does
336 not need escaping.
337
338 Since boa builds the argument list and does not call /bin/sh,
339 (boa uses execve for CGI)
340 */
341
342 if (q && !strchr(q, '=')) {
343 /* we have an 'index' style */
344 q = strdup(q);
345 if (!q) {
346 WARN("unable to strdup 'q' in create_argv!");
347 }
348 for (aargc = 1; q && (aargc < CGI_ARGC_MAX);) {
349 r = q;
350 /* for an index-style CGI, + is used to seperate arguments
351 * an escaped '+' is of no concern to us
352 */
353 if ((p = strchr(q, '+'))) {
354 *p = '\0';
355 q = p + 1;
356 } else {
357 q = NULL;
358 }
359 if (unescape_uri(r, NULL)) {
360 /* printf("parameter %d: %s\n",aargc,r); */
361 aargv[aargc++] = r;
362 }
363 }
364 aargv[aargc] = NULL;
365 } else {
366 aargv[1] = NULL;
367 }
368 }
369
370 /*
371 * Name: init_cgi
372 *
373 * Description: Called for GET/POST requests that refer to ScriptAlias
374 * directories or application/x-httpd-cgi files. Pipes are used for the
375 * communication with the child.
376 * stderr remains tied to our log file; is this good?
377 *
378 * Returns:
379 * 0 - error or NPH, either way the socket is closed
380 * 1 - success
381 */
382
383 int init_cgi(request * req)
384 {
385 int child_pid;
386 int pipes[2];
387
388 SQUASH_KA(req);
389
390 if (req->is_cgi == NPH || req->is_cgi == CGI || req->is_cgi == HIC_CGI) {
391 if (complete_env(req) == 0) {
392 return 0;
393 }
394 }
395 #ifdef FASCIST_LOGGING
396 {
397 int i;
398 for (i = 0; i < req->cgi_env_index; ++i)
399 fprintf(stderr, "%s - environment variable for cgi: \"%s\"\n",
400 __FILE__, req->cgi_env[i]);
401 }
402 #endif
403
404 if (req->is_cgi) {
405 if (pipe(pipes) == -1) {
406 log_error_time();
407 perror("pipe");
408 return 0;
409 }
410
411 /* set the read end of the socket to non-blocking */
412 if (set_nonblock_fd(pipes[0]) == -1) {
413 log_error_time();
414 perror("cgi-fcntl");
415 close(pipes[0]);
416 close(pipes[1]);
417 return 0;
418 }
419 } else {
420 log_error_time();
421 fprintf(stderr, "Non CGI in init_cgi()!\n");
422 return 0;
423 }
424
425 if (req->is_cgi == HIC_CGI) { /* internally handled cgi */
426 /* This is wrong. We must not block here (FIXME!!)
427 */
428 if (hic_send_command(req, pipes[1]) == -1) {
429 log_error_time();
430 fprintf(stderr, "Error in HIC\n");
431 close(pipes[0]);
432 close(pipes[1]);
433 return 0;
434 }
435 } else { /* plain cgi... do fork */
436 child_pid = fork();
437 switch (child_pid) {
438 case -1:
439 /* fork unsuccessful */
440 log_error_time();
441 perror("fork");
442
443 close(pipes[0]);
444 close(pipes[1]);
445
446 send_r_error(req);
447 /* FIXME: There is aproblem here. send_r_error would work
448 for NPH and CGI, but not for GUNZIP. Fix that. */
449 /* i'd like to send_r_error, but.... */
450 return 0;
451 break;
452 case 0:
453 /* child */
454 if (req->is_cgi == CGI || req->is_cgi == NPH) {
455 char *foo = strdup(req->pathname);
456 char *c;
457
458 if (!foo) {
459 WARN("unable to strdup pathname for req->pathname");
460 _exit(1);
461 }
462 c = strrchr(foo, '/');
463 if (c) {
464 ++c;
465 *c = '\0';
466 } else {
467 /* we have a serious problem */
468 log_error_time();
469 perror("chdir");
470 close(pipes[1]);
471 _exit(1);
472 }
473 if (chdir(foo) != 0) {
474 log_error_time();
475 perror("chdir");
476 close(pipes[1]);
477 _exit(1);
478 }
479 }
480 close(pipes[0]);
481 /* tie cgi's STDOUT to it's write end of pipe */
482 if (dup2(pipes[1], STDOUT_FILENO) == -1) {
483 log_error_time();
484 perror("dup2 - pipes");
485 close(pipes[1]);
486 _exit(1);
487 }
488 close(pipes[1]);
489 if (set_block_fd(STDOUT_FILENO) == -1) {
490 log_error_time();
491 perror("cgi-fcntl");
492 _exit(1);
493 }
494
495 /* tie post_data_fd to POST stdin */
496 if (req->method == M_POST) { /* tie stdin to file */
497 lseek(req->post_data_fd, SEEK_SET, 0);
498 dup2(req->post_data_fd, STDIN_FILENO);
499 close(req->post_data_fd);
500 }
501 /* Close access log, so CGI program can't scribble
502 * where it shouldn't
503 */
504 close_access_log();
505
506 /*
507 * tie STDERR to cgi_log_fd
508 * cgi_log_fd will automatically close, close-on-exec rocks!
509 * if we don't tied STDERR (current log_error) to cgi_log_fd,
510 * then we ought to close it.
511 */
512 if (!cgi_log_fd)
513 dup2(devnullfd, STDERR_FILENO);
514 else
515 dup2(cgi_log_fd, STDERR_FILENO);
516
517 if (req->is_cgi == NPH || req->is_cgi == CGI) {
518 char *aargv[CGI_ARGC_MAX + 1];
519 create_argv(req, aargv);
520 execve(req->pathname, aargv, req->cgi_env);
521 } else {
522 if (req->is_cgi == INDEXER_CGI)
523 execl(dirmaker, dirmaker, req->pathname, req->request_uri,
524 NULL);
525 }
526 /* execve failed */
527 WARN(req->pathname);
528 _exit(1);
529
530 break; /* it doesn't matter, we never make it until here */
531
532 default:
533 /* parent */
534 /* if here, fork was successful */
535 if (verbose_cgi_logs) {
536 log_error_time();
537 fprintf(stderr, "Forked child \"%s\" pid %d\n",
538 req->pathname, child_pid);
539 }
540
541 if (req->method == M_POST) {
542 close(req->post_data_fd); /* child closed it too */
543 req->post_data_fd = -1;
544 }
545
546 /* NPH, etc... all go straight to the fd */
547
548 close(pipes[1]);
549 break;
550 }
551 } /* HIC */
552
553 /* we only get here in parent case, and
554 * success.
555 */
556
557 req->data_fd = pipes[0];
558
559 req->status = PIPE_READ;
560 if (req->is_cgi == CGI || req->is_cgi == HIC_CGI) {
561 req->cgi_status = CGI_PARSE; /* got to parse cgi header */
562 /* for cgi_header... I get half the buffer! */
563 req->header_line = req->header_end = (req->buffer + BUFFER_SIZE / 2);
564 } else {
565 req->cgi_status = CGI_BUFFER;
566 /* I get all the buffer! */
567 req->header_line = req->header_end = req->buffer;
568 }
569
570 /* reset req->filepos for logging (it's used in pipe.c) */
571 /* still don't know why req->filesize might be reset though */
572 req->filepos = 0;
573
574 return 1;
575 }

webmaster@linux.gr
ViewVC Help
Powered by ViewVC 1.1.26