Add support for Websockets with https inspection enabled
[privoxy.git] / jcc.c
1 /*********************************************************************
2  *
3  * File        :  $Source: /cvsroot/ijbswa/current/jcc.c,v $
4  *
5  * Purpose     :  Main file.  Contains main() method, main loop, and
6  *                the main connection-handling function.
7  *
8  * Copyright   :  Written by and Copyright (C) 2001-2020 the
9  *                Privoxy team. https://www.privoxy.org/
10  *
11  *                Based on the Internet Junkbuster originally written
12  *                by and Copyright (C) 1997 Anonymous Coders and
13  *                Junkbusters Corporation.  http://www.junkbusters.com
14  *
15  *                This program is free software; you can redistribute it
16  *                and/or modify it under the terms of the GNU General
17  *                Public License as published by the Free Software
18  *                Foundation; either version 2 of the License, or (at
19  *                your option) any later version.
20  *
21  *                This program is distributed in the hope that it will
22  *                be useful, but WITHOUT ANY WARRANTY; without even the
23  *                implied warranty of MERCHANTABILITY or FITNESS FOR A
24  *                PARTICULAR PURPOSE.  See the GNU General Public
25  *                License for more details.
26  *
27  *                The GNU General Public License should be included with
28  *                this file.  If not, you can view it at
29  *                http://www.gnu.org/copyleft/gpl.html
30  *                or write to the Free Software Foundation, Inc., 59
31  *                Temple Place - Suite 330, Boston, MA  02111-1307, USA.
32  *
33  *********************************************************************/
34
35
36 #include "config.h"
37
38 #include <stdio.h>
39 #include <sys/types.h>
40 #include <stdlib.h>
41 #include <string.h>
42 #include <signal.h>
43 #include <fcntl.h>
44 #include <errno.h>
45 #include <assert.h>
46
47 #ifdef _WIN32
48 # ifndef FEATURE_PTHREAD
49 #  ifndef STRICT
50 #   define STRICT
51 #  endif
52 #  include <winsock2.h>
53 #  include <windows.h>
54 #  include <process.h>
55 # endif /* ndef FEATURE_PTHREAD */
56
57 # include "win32.h"
58 # ifndef _WIN_CONSOLE
59 #  include "w32log.h"
60 # endif /* ndef _WIN_CONSOLE */
61 # include "w32svrapi.h"
62
63 #else /* ifndef _WIN32 */
64
65 # include <unistd.h>
66 # include <sys/wait.h>
67 # include <sys/time.h>
68 # include <sys/stat.h>
69 # include <sys/ioctl.h>
70
71 #ifdef sun
72 #include <sys/termios.h>
73 #endif /* sun */
74
75 #ifdef unix
76 #include <pwd.h>
77 #include <grp.h>
78 #endif
79
80 # include <signal.h>
81
82 # ifdef __BEOS__
83 #  include <socket.h>  /* BeOS has select() for sockets only. */
84 #  include <OS.h>      /* declarations for threads and stuff. */
85 # endif
86
87 #ifdef HAVE_POLL
88 #ifdef __GLIBC__
89 #include <sys/poll.h>
90 #else
91 #include <poll.h>
92 #endif /* def __GLIBC__ */
93 #else
94 # ifndef FD_ZERO
95 #  include <select.h>
96 # endif
97 #warning poll() appears to be unavailable. Your platform will become unsupported in the future.
98 #endif /* HAVE_POLL */
99
100 #endif
101
102 #include "project.h"
103 #include "list.h"
104 #include "jcc.h"
105 #ifdef FEATURE_HTTPS_INSPECTION
106 #include "ssl.h"
107 #endif
108 #include "filters.h"
109 #include "loaders.h"
110 #include "parsers.h"
111 #include "miscutil.h"
112 #include "errlog.h"
113 #include "jbsockets.h"
114 #include "gateway.h"
115 #include "actions.h"
116 #include "cgi.h"
117 #include "loadcfg.h"
118 #include "urlmatch.h"
119 #ifdef FEATURE_CLIENT_TAGS
120 #include "client-tags.h"
121 #endif
122
123 int daemon_mode = 1;
124 struct client_states clients[1];
125 struct file_list     files[1];
126
127 #ifdef FEATURE_STATISTICS
128 int urls_read     = 0;     /* total nr of urls read inc rejected */
129 int urls_rejected = 0;     /* total nr of urls rejected */
130 #endif /* def FEATURE_STATISTICS */
131
132 #ifdef FEATURE_GRACEFUL_TERMINATION
133 int g_terminate = 0;
134 #endif
135
136 #if !defined(_WIN32)
137 static void sig_handler(int the_signal);
138 #endif
139 static int client_protocol_is_unsupported(struct client_state *csp, char *req);
140 static jb_err get_request_destination_elsewhere(struct client_state *csp, struct list *headers);
141 static jb_err get_server_headers(struct client_state *csp);
142 static const char *crunch_reason(const struct http_response *rsp);
143 static void send_crunch_response(struct client_state *csp, struct http_response *rsp);
144 static char *get_request_line(struct client_state *csp);
145 static jb_err receive_client_request(struct client_state *csp);
146 static jb_err parse_client_request(struct client_state *csp);
147 static void build_request_line(struct client_state *csp, const struct forward_spec *fwd, char **request_line);
148 static jb_err change_request_destination(struct client_state *csp);
149 static void handle_established_connection(struct client_state *csp);
150 static void chat(struct client_state *csp);
151 static void serve(struct client_state *csp);
152 #if !defined(_WIN32) || defined(_WIN_CONSOLE)
153 static void usage(const char *myname);
154 #endif
155 static void initialize_mutexes(void);
156 static jb_socket bind_port_helper(const char *haddr, int hport, int backlog);
157 static void bind_ports_helper(struct configuration_spec *config, jb_socket sockets[]);
158 static void close_ports_helper(jb_socket sockets[]);
159 static void listen_loop(void);
160 static void serve(struct client_state *csp);
161
162 #ifdef __BEOS__
163 static int32 server_thread(void *data);
164 #endif /* def __BEOS__ */
165
166 #ifdef _WIN32
167 #define sleep(N)  Sleep(((N) * 1000))
168 #endif
169
170 #ifdef FUZZ
171 int process_fuzzed_input(char *fuzz_input_type, char *fuzz_input_file);
172 void show_fuzz_usage(const char *name);
173 #endif
174
175 #ifdef MUTEX_LOCKS_AVAILABLE
176 /*
177  * XXX: Does the locking stuff really belong in this file?
178  */
179 privoxy_mutex_t log_mutex;
180 privoxy_mutex_t log_init_mutex;
181 privoxy_mutex_t connection_reuse_mutex;
182
183 #ifdef FEATURE_HTTPS_INSPECTION
184 privoxy_mutex_t certificate_mutex;
185 privoxy_mutex_t ssl_init_mutex;
186 #endif
187
188 #ifdef FEATURE_EXTERNAL_FILTERS
189 privoxy_mutex_t external_filter_mutex;
190 #endif
191 #ifdef FEATURE_CLIENT_TAGS
192 privoxy_mutex_t client_tags_mutex;
193 #endif
194 #ifdef FEATURE_EXTENDED_STATISTICS
195 privoxy_mutex_t filter_statistics_mutex;
196 privoxy_mutex_t block_statistics_mutex;
197 #endif
198
199 #if !defined(HAVE_GETHOSTBYADDR_R) || !defined(HAVE_GETHOSTBYNAME_R)
200 privoxy_mutex_t resolver_mutex;
201 #endif /* !defined(HAVE_GETHOSTBYADDR_R) || !defined(HAVE_GETHOSTBYNAME_R) */
202
203 #ifndef HAVE_GMTIME_R
204 privoxy_mutex_t gmtime_mutex;
205 #endif /* ndef HAVE_GMTIME_R */
206
207 #ifndef HAVE_LOCALTIME_R
208 privoxy_mutex_t localtime_mutex;
209 #endif /* ndef HAVE_LOCALTIME_R */
210
211 #if !defined(HAVE_ARC4RANDOM) && !defined(HAVE_RANDOM)
212 privoxy_mutex_t rand_mutex;
213 #endif /* !defined(HAVE_ARC4RANDOM) && !defined(HAVE_RANDOM) */
214
215 #endif /* def MUTEX_LOCKS_AVAILABLE */
216
217 #if defined(unix)
218 const char *basedir = NULL;
219 const char *pidfile = NULL;
220 static int received_hup_signal = 0;
221 #endif /* defined unix */
222
223 /* HTTP snippets. */
224 static const char CSUCCEED[] =
225    "HTTP/1.1 200 Connection established\r\n\r\n";
226
227 static const char CHEADER[] =
228    "HTTP/1.1 400 Invalid header received from client\r\n"
229    "Content-Type: text/plain\r\n"
230    "Connection: close\r\n\r\n"
231    "Invalid header received from client.\r\n";
232
233 static const char FTP_RESPONSE[] =
234    "HTTP/1.1 400 Invalid request received from client\r\n"
235    "Content-Type: text/plain\r\n"
236    "Connection: close\r\n\r\n"
237    "Invalid request. Privoxy doesn't support FTP.\r\n";
238
239 static const char GOPHER_RESPONSE[] =
240    "HTTP/1.1 400 Invalid request received from client\r\n"
241    "Content-Type: text/plain\r\n"
242    "Connection: close\r\n\r\n"
243    "Invalid request. Privoxy doesn't support gopher.\r\n";
244
245 /* XXX: should be a template */
246 static const char MISSING_DESTINATION_RESPONSE[] =
247    "HTTP/1.1 400 Bad request received from client\r\n"
248    "Content-Type: text/plain\r\n"
249    "Connection: close\r\n\r\n"
250    "Bad request. Privoxy was unable to extract the destination.\r\n";
251
252 /* XXX: should be a template */
253 static const char INVALID_SERVER_HEADERS_RESPONSE[] =
254    "HTTP/1.1 502 Server or forwarder response invalid\r\n"
255    "Content-Type: text/plain\r\n"
256    "Connection: close\r\n\r\n"
257    "Bad response. The server or forwarder response doesn't look like HTTP.\r\n";
258
259 /* XXX: should be a template */
260 static const char MESSED_UP_REQUEST_RESPONSE[] =
261    "HTTP/1.1 400 Malformed request after rewriting\r\n"
262    "Content-Type: text/plain\r\n"
263    "Connection: close\r\n\r\n"
264    "Bad request. Messed up with header filters.\r\n";
265
266 static const char TOO_MANY_CONNECTIONS_RESPONSE[] =
267    "HTTP/1.1 503 Too many open connections\r\n"
268    "Content-Type: text/plain\r\n"
269    "Connection: close\r\n\r\n"
270    "Maximum number of open connections reached.\r\n";
271
272 static const char CLIENT_CONNECTION_TIMEOUT_RESPONSE[] =
273    "HTTP/1.1 504 Connection timeout\r\n"
274    "Content-Type: text/plain\r\n"
275    "Connection: close\r\n\r\n"
276    "The connection timed out because the client request didn't arrive in time.\r\n";
277
278 static const char CLIENT_BODY_PARSE_ERROR_RESPONSE[] =
279    "HTTP/1.1 400 Failed reading client body\r\n"
280    "Content-Type: text/plain\r\n"
281    "Connection: close\r\n\r\n"
282    "Failed parsing or buffering the chunk-encoded client body.\r\n";
283
284 static const char UNSUPPORTED_CLIENT_EXPECTATION_ERROR_RESPONSE[] =
285    "HTTP/1.1 417 Expecting too much\r\n"
286    "Content-Type: text/plain\r\n"
287    "Connection: close\r\n\r\n"
288    "Privoxy detected an unsupported Expect header value.\r\n";
289
290 /* A function to crunch a response */
291 typedef struct http_response *(*crunch_func_ptr)(struct client_state *);
292
293 /* Crunch function flags */
294 #define CF_NO_FLAGS        0
295 /* Cruncher applies to forced requests as well */
296 #define CF_IGNORE_FORCE    1
297 /* Crunched requests are counted for the block statistics */
298 #define CF_COUNT_AS_REJECT 2
299
300 /* A crunch function and its flags */
301 struct cruncher
302 {
303    const crunch_func_ptr cruncher;
304    const int flags;
305 };
306
307 static int crunch_response_triggered(struct client_state *csp, const struct cruncher crunchers[]);
308
309 /* Complete list of cruncher functions */
310 static const struct cruncher crunchers_all[] = {
311    { direct_response, CF_COUNT_AS_REJECT|CF_IGNORE_FORCE},
312    { block_url,       CF_COUNT_AS_REJECT },
313 #ifdef FEATURE_TRUST
314    { trust_url,       CF_COUNT_AS_REJECT },
315 #endif /* def FEATURE_TRUST */
316    { redirect_url,    CF_NO_FLAGS  },
317    { dispatch_cgi,    CF_IGNORE_FORCE},
318    { NULL,            0 }
319 };
320
321 /* Light version, used after tags are applied */
322 static const struct cruncher crunchers_light[] = {
323    { block_url,       CF_COUNT_AS_REJECT },
324    { redirect_url,    CF_NO_FLAGS },
325    { NULL,            0 }
326 };
327
328
329 /*
330  * XXX: Don't we really mean
331  *
332  * #if defined(unix)
333  *
334  * here?
335  */
336 #if !defined(_WIN32)
337 /*********************************************************************
338  *
339  * Function    :  sig_handler
340  *
341  * Description :  Signal handler for different signals.
342  *                Exit gracefully on TERM and INT
343  *                or set a flag that will cause the errlog
344  *                to be reopened by the main thread on HUP.
345  *
346  * Parameters  :
347  *          1  :  the_signal = the signal cause this function to call
348  *
349  * Returns     :  -
350  *
351  *********************************************************************/
352 static void sig_handler(int the_signal)
353 {
354    switch(the_signal)
355    {
356       case SIGTERM:
357       case SIGINT:
358          log_error(LOG_LEVEL_INFO, "exiting by signal %d .. bye", the_signal);
359 #if defined(unix)
360          if (pidfile)
361          {
362             unlink(pidfile);
363          }
364 #endif /* unix */
365          exit(the_signal);
366          break;
367
368       case SIGHUP:
369 #if defined(unix)
370          received_hup_signal = 1;
371 #endif
372          break;
373
374       default:
375          /*
376           * We shouldn't be here, unless we catch signals
377           * in main() that we can't handle here!
378           */
379          log_error(LOG_LEVEL_FATAL, "sig_handler: exiting on unexpected signal %d", the_signal);
380    }
381    return;
382
383 }
384 #endif
385
386
387 /*********************************************************************
388  *
389  * Function    :  get_write_delay
390  *
391  * Description :  Parse the delay-response parameter.
392  *
393  * Parameters  :
394  *          1  :  csp = Current client state (buffers, headers, etc...)
395  *
396  * Returns     :  Number of milliseconds to delay writes.
397  *
398  *********************************************************************/
399 static unsigned int get_write_delay(const struct client_state *csp)
400 {
401    unsigned int delay;
402    char *endptr;
403    char *newval;
404
405    if ((csp->action->flags & ACTION_DELAY_RESPONSE) == 0)
406    {
407       return 0;
408    }
409    newval = csp->action->string[ACTION_STRING_DELAY_RESPONSE];
410
411    delay = (unsigned)strtol(newval, &endptr, 0);
412    if (*endptr != '\0')
413    {
414       log_error(LOG_LEVEL_FATAL,
415          "Invalid delay-response{} parameter: '%s'", newval);
416    }
417
418    return delay;
419
420 }
421
422
423 /*********************************************************************
424  *
425  * Function    :  client_protocol_is_unsupported
426  *
427  * Description :  Checks if the client used a known unsupported
428  *                protocol and deals with it by sending an error
429  *                response.
430  *
431  * Parameters  :
432  *          1  :  csp = Current client state (buffers, headers, etc...)
433  *          2  :  req = the first request line send by the client
434  *
435  * Returns     :  TRUE if an error response has been generated, or
436  *                FALSE if the request doesn't look invalid.
437  *
438  *********************************************************************/
439 static int client_protocol_is_unsupported(struct client_state *csp, char *req)
440 {
441    /*
442     * If it's a FTP or gopher request, we don't support it.
443     *
444     * These checks are better than nothing, but they might
445     * not work in all configurations and some clients might
446     * have problems digesting the answer.
447     *
448     * They should, however, never cause more problems than
449     * Privoxy's old behaviour (returning the misleading HTML
450     * error message:
451     *
452     * "Could not resolve http://(ftp|gopher)://example.org").
453     */
454    if (!strncmpic(req, "GET ftp://", 10) || !strncmpic(req, "GET gopher://", 13))
455    {
456       const char *response = NULL;
457       const char *protocol = NULL;
458
459       if (!strncmpic(req, "GET ftp://", 10))
460       {
461          response = FTP_RESPONSE;
462          protocol = "FTP";
463       }
464       else
465       {
466          response = GOPHER_RESPONSE;
467          protocol = "GOPHER";
468       }
469       log_error(LOG_LEVEL_ERROR,
470          "%s tried to use Privoxy as %s proxy: %s",
471          csp->ip_addr_str, protocol, req);
472       log_error(LOG_LEVEL_CLF,
473          "%s - - [%T] \"%s\" 400 0", csp->ip_addr_str, req);
474       freez(req);
475
476 #ifdef FEATURE_HTTPS_INSPECTION
477       if (client_use_ssl(csp))
478       {
479          ssl_send_data_delayed(&(csp->ssl_client_attr),
480             (const unsigned char *)response, strlen(response),
481             get_write_delay(csp));
482       }
483       else
484 #endif
485       {
486          write_socket_delayed(csp->cfd, response, strlen(response),
487             get_write_delay(csp));
488       }
489
490       return TRUE;
491    }
492
493    return FALSE;
494 }
495
496
497 /*********************************************************************
498  *
499  * Function    :  client_has_unsupported_expectations
500  *
501  * Description :  Checks if the client used an unsupported expectation
502  *                in which case an error message is delivered.
503  *
504  * Parameters  :
505  *          1  :  csp = Current client state (buffers, headers, etc...)
506  *
507  * Returns     :  TRUE if an error response has been generated, or
508  *                FALSE if the request doesn't look invalid.
509  *
510  *********************************************************************/
511 static int client_has_unsupported_expectations(const struct client_state *csp)
512 {
513    if ((csp->flags & CSP_FLAG_UNSUPPORTED_CLIENT_EXPECTATION))
514    {
515       log_error(LOG_LEVEL_ERROR,
516          "Rejecting request from client %s with unsupported Expect header value",
517          csp->ip_addr_str);
518       log_error(LOG_LEVEL_CLF,
519          "%s - - [%T] \"%s\" 417 0", csp->ip_addr_str, csp->http->cmd);
520       write_socket_delayed(csp->cfd,
521          UNSUPPORTED_CLIENT_EXPECTATION_ERROR_RESPONSE,
522          strlen(UNSUPPORTED_CLIENT_EXPECTATION_ERROR_RESPONSE),
523          get_write_delay(csp));
524
525       return TRUE;
526    }
527
528    return FALSE;
529
530 }
531
532
533 /*********************************************************************
534  *
535  * Function    :  get_request_destination_elsewhere
536  *
537  * Description :  If the client's request was redirected into
538  *                Privoxy without the client's knowledge,
539  *                the request line lacks the destination host.
540  *
541  *                This function tries to get it elsewhere,
542  *                provided accept-intercepted-requests is enabled.
543  *
544  *                "Elsewhere" currently only means "Host: header",
545  *                but in the future we may ask the redirecting
546  *                packet filter to look the destination up.
547  *
548  *                If the destination stays unknown, an error
549  *                response is send to the client and headers
550  *                are freed so that chat() can return directly.
551  *
552  * Parameters  :
553  *          1  :  csp = Current client state (buffers, headers, etc...)
554  *          2  :  headers = a header list
555  *
556  * Returns     :  JB_ERR_OK if the destination is now known, or
557  *                JB_ERR_PARSE if it isn't.
558  *
559  *********************************************************************/
560 static jb_err get_request_destination_elsewhere(struct client_state *csp, struct list *headers)
561 {
562    char *req;
563
564    if (!(csp->config->feature_flags & RUNTIME_FEATURE_ACCEPT_INTERCEPTED_REQUESTS))
565    {
566       log_error(LOG_LEVEL_ERROR, "%s's request: \'%s\' is invalid."
567          " Privoxy isn't configured to accept intercepted requests.",
568          csp->ip_addr_str, csp->http->cmd);
569       /* XXX: Use correct size */
570       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 400 0",
571          csp->ip_addr_str, csp->http->cmd);
572
573       write_socket_delayed(csp->cfd, CHEADER, strlen(CHEADER),
574          get_write_delay(csp));
575       destroy_list(headers);
576
577       return JB_ERR_PARSE;
578    }
579    else if (JB_ERR_OK == get_destination_from_headers(headers, csp->http))
580    {
581       /* Split the domain we just got for pattern matching */
582       init_domain_components(csp->http);
583
584       return JB_ERR_OK;
585    }
586    else
587    {
588       /* We can't work without destination. Go spread the news.*/
589
590       req = list_to_text(headers);
591       chomp(req);
592       /* XXX: Use correct size */
593       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 400 0",
594          csp->ip_addr_str, csp->http->cmd);
595       log_error(LOG_LEVEL_ERROR,
596          "Privoxy was unable to get the destination for %s's request:\n%s\n%s",
597          csp->ip_addr_str, csp->http->cmd, req);
598       freez(req);
599
600       write_socket_delayed(csp->cfd, MISSING_DESTINATION_RESPONSE,
601          strlen(MISSING_DESTINATION_RESPONSE), get_write_delay(csp));
602       destroy_list(headers);
603
604       return JB_ERR_PARSE;
605    }
606    /*
607     * TODO: If available, use PF's ioctl DIOCNATLOOK as last resort
608     * to get the destination IP address, use it as host directly
609     * or do a reverse DNS lookup first.
610     */
611 }
612
613
614 /*********************************************************************
615  *
616  * Function    :  get_server_headers
617  *
618  * Description :  Parses server headers in iob and fills them
619  *                into csp->headers so that they can later be
620  *                handled by sed().
621  *
622  * Parameters  :
623  *          1  :  csp = Current client state (buffers, headers, etc...)
624  *
625  * Returns     :  JB_ERR_OK if everything went fine, or
626  *                JB_ERR_PARSE if the headers were incomplete.
627  *
628  *********************************************************************/
629 static jb_err get_server_headers(struct client_state *csp)
630 {
631    int continue_hack_in_da_house = 0;
632    char * header;
633
634    while (((header = get_header(csp->iob)) != NULL) || continue_hack_in_da_house)
635    {
636       if (header == NULL)
637       {
638          /*
639           * continue hack in da house. Ignore the ending of
640           * this head and continue enlisting header lines.
641           * The reason is described below.
642           */
643          enlist(csp->headers, "");
644          continue_hack_in_da_house = 0;
645          continue;
646       }
647       else if (0 == strncmpic(header, "HTTP/1.1 100", 12))
648       {
649          /*
650           * It's a bodyless continue response, don't
651           * stop header parsing after reaching its end.
652           *
653           * As a result Privoxy will concatenate the
654           * next response's head and parse and deliver
655           * the headers as if they belonged to one request.
656           *
657           * The client will separate them because of the
658           * empty line between them.
659           *
660           * XXX: What we're doing here is clearly against
661           * the intended purpose of the continue header,
662           * and under some conditions (HTTP/1.0 client request)
663           * it's a standard violation.
664           *
665           * Anyway, "sort of against the spec" is preferable
666           * to "always getting confused by Continue responses"
667           * (Privoxy's behaviour before this hack was added)
668           */
669          log_error(LOG_LEVEL_HEADER, "Continue hack in da house.");
670          continue_hack_in_da_house = 1;
671       }
672       else if (*header == '\0')
673       {
674          /*
675           * If the header is empty, but the Continue hack
676           * isn't active, we can assume that we reached the
677           * end of the buffer before we hit the end of the
678           * head.
679           *
680           * Inform the caller an let it decide how to handle it.
681           */
682          return JB_ERR_PARSE;
683       }
684
685       if (JB_ERR_MEMORY == enlist(csp->headers, header))
686       {
687          /*
688           * XXX: Should we quit the request and return a
689           * out of memory error page instead?
690           */
691          log_error(LOG_LEVEL_ERROR,
692             "Out of memory while enlisting server headers. %s lost.",
693             header);
694       }
695       freez(header);
696    }
697
698    return JB_ERR_OK;
699 }
700
701
702 /*********************************************************************
703  *
704  * Function    :  crunch_reason
705  *
706  * Description :  Translates the crunch reason code into a string.
707  *
708  * Parameters  :
709  *          1  :  rsp = a http_response
710  *
711  * Returns     :  A string with the crunch reason or an error description.
712  *
713  *********************************************************************/
714 static const char *crunch_reason(const struct http_response *rsp)
715 {
716    char * reason = NULL;
717
718    assert(rsp != NULL);
719    if (rsp == NULL)
720    {
721       return "Internal error while searching for crunch reason";
722    }
723
724    switch (rsp->crunch_reason)
725    {
726       case UNSUPPORTED:
727          reason = "Unsupported HTTP feature";
728          break;
729       case BLOCKED:
730          reason = "Blocked";
731          break;
732       case UNTRUSTED:
733          reason = "Untrusted";
734          break;
735       case REDIRECTED:
736          reason = "Redirected";
737          break;
738       case CGI_CALL:
739          reason = "CGI Call";
740          break;
741       case NO_SUCH_DOMAIN:
742          reason = "DNS failure";
743          break;
744       case FORWARDING_FAILED:
745          reason = "Forwarding failed";
746          break;
747       case CONNECT_FAILED:
748          reason = "Connection failure";
749          break;
750       case OUT_OF_MEMORY:
751          reason = "Out of memory (may mask other reasons)";
752          break;
753       case CONNECTION_TIMEOUT:
754          reason = "Connection timeout";
755          break;
756       case NO_SERVER_DATA:
757          reason = "No server data received";
758          break;
759       default:
760          reason = "No reason recorded";
761          break;
762    }
763
764    return reason;
765 }
766
767
768 /*********************************************************************
769  *
770  * Function    :  log_applied_actions
771  *
772  * Description :  Logs the applied actions if LOG_LEVEL_ACTIONS is
773  *                enabled.
774  *
775  * Parameters  :
776  *          1  :  actions = Current action spec to log
777  *
778  * Returns     :  Nothing.
779  *
780  *********************************************************************/
781 static void log_applied_actions(const struct current_action_spec *actions)
782 {
783    /*
784     * The conversion to text requires lots of memory allocations so
785     * we only do the conversion if the user is actually interested.
786     */
787    if (debug_level_is_enabled(LOG_LEVEL_ACTIONS))
788    {
789       char *actions_as_text = actions_to_line_of_text(actions);
790       log_error(LOG_LEVEL_ACTIONS, "%s", actions_as_text);
791       freez(actions_as_text);
792    }
793 }
794
795
796 /*********************************************************************
797  *
798  * Function    :  send_crunch_response
799  *
800  * Description :  Delivers already prepared response for
801  *                intercepted requests, logs the interception
802  *                and frees the response.
803  *
804  * Parameters  :
805  *          1  :  csp = Current client state (buffers, headers, etc...)
806  *          2  :  rsp = Fully prepared response. Will be freed on exit.
807  *
808  * Returns     :  Nothing.
809  *
810  *********************************************************************/
811 static void send_crunch_response(struct client_state *csp, struct http_response *rsp)
812 {
813       const struct http_request *http = csp->http;
814       char status_code[4];
815
816       assert(rsp != NULL);
817       assert(rsp->head != NULL);
818
819       if (rsp == NULL)
820       {
821          log_error(LOG_LEVEL_FATAL, "NULL response in send_crunch_response.");
822       }
823
824       /*
825        * Extract the status code from the actual head
826        * that will be send to the client. It is the only
827        * way to get it right for all requests, including
828        * the fixed ones for out-of-memory problems.
829        *
830        * A head starts like this: 'HTTP/1.1 200...'
831        *                           0123456789|11
832        *                                     10
833        */
834       status_code[0] = rsp->head[9];
835       status_code[1] = rsp->head[10];
836       status_code[2] = rsp->head[11];
837       status_code[3] = '\0';
838
839       /* Log that the request was crunched and why. */
840       log_applied_actions(csp->action);
841 #ifdef FEATURE_HTTPS_INSPECTION
842       if (client_use_ssl(csp))
843       {
844          log_error(LOG_LEVEL_CRUNCH, "%s: https://%s%s", crunch_reason(rsp),
845             http->hostport, http->path);
846          log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s https://%s%s %s\" %s %lu",
847             csp->ip_addr_str, http->gpc, http->hostport, http->path,
848             http->version, status_code, rsp->content_length);
849       }
850       else
851 #endif
852       {
853          log_error(LOG_LEVEL_CRUNCH, "%s: %s", crunch_reason(rsp), http->url);
854          log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" %s %lu",
855             csp->ip_addr_str, http->ocmd, status_code, rsp->content_length);
856       }
857       /* Write the answer to the client */
858 #ifdef FEATURE_HTTPS_INSPECTION
859       if (client_use_ssl(csp))
860       {
861          if ((ssl_send_data_delayed(&(csp->ssl_client_attr),
862                 (const unsigned char *)rsp->head, rsp->head_length,
863                 get_write_delay(csp)) < 0)
864           || (ssl_send_data_delayed(&(csp->ssl_client_attr),
865                 (const unsigned char *)rsp->body, rsp->content_length,
866                 get_write_delay(csp)) < 0))
867          {
868             /* There is nothing we can do about it. */
869             log_error(LOG_LEVEL_CONNECT, "Couldn't deliver the error message "
870                "for https://%s%s through client socket %d using TLS/SSL",
871                http->hostport, http->url, csp->cfd);
872          }
873       }
874       else
875 #endif
876       {
877          if (write_socket_delayed(csp->cfd, rsp->head, rsp->head_length,
878                 get_write_delay(csp))
879           || write_socket_delayed(csp->cfd, rsp->body, rsp->content_length,
880                 get_write_delay(csp)))
881          {
882             /* There is nothing we can do about it. */
883             log_error(LOG_LEVEL_CONNECT,
884                "Couldn't deliver the error message for %s through client socket %d: %E",
885                http->url, csp->cfd);
886          }
887       }
888
889       /* Clean up and return */
890       if (cgi_error_memory() != rsp)
891       {
892          free_http_response(rsp);
893       }
894       return;
895 }
896
897
898 /*********************************************************************
899  *
900  * Function    :  crunch_response_triggered
901  *
902  * Description :  Checks if the request has to be crunched,
903  *                and delivers the crunch response if necessary.
904  *
905  * Parameters  :
906  *          1  :  csp = Current client state (buffers, headers, etc...)
907  *          2  :  crunchers = list of cruncher functions to run
908  *
909  * Returns     :  TRUE if the request was answered with a crunch response
910  *                FALSE otherwise.
911  *
912  *********************************************************************/
913 static int crunch_response_triggered(struct client_state *csp, const struct cruncher crunchers[])
914 {
915    struct http_response *rsp = NULL;
916    const struct cruncher *c;
917
918    /*
919     * If CGI request crunching is disabled,
920     * check the CGI dispatcher out of order to
921     * prevent unintentional blocks or redirects.
922     */
923    if (!(csp->config->feature_flags & RUNTIME_FEATURE_CGI_CRUNCHING)
924        && (NULL != (rsp = dispatch_cgi(csp))))
925    {
926       /* Deliver, log and free the interception response. */
927       send_crunch_response(csp, rsp);
928       csp->flags |= CSP_FLAG_CRUNCHED;
929       return TRUE;
930    }
931
932    for (c = crunchers; c->cruncher != NULL; c++)
933    {
934       /*
935        * Check the cruncher if either Privoxy is toggled
936        * on and the request isn't forced, or if the cruncher
937        * applies to forced requests as well.
938        */
939       if (((csp->flags & CSP_FLAG_TOGGLED_ON) &&
940           !(csp->flags & CSP_FLAG_FORCED)) ||
941           (c->flags & CF_IGNORE_FORCE))
942       {
943          rsp = c->cruncher(csp);
944          if (NULL != rsp)
945          {
946             /* Deliver, log and free the interception response. */
947             send_crunch_response(csp, rsp);
948             csp->flags |= CSP_FLAG_CRUNCHED;
949 #ifdef FEATURE_STATISTICS
950             if (c->flags & CF_COUNT_AS_REJECT)
951             {
952                csp->flags |= CSP_FLAG_REJECTED;
953             }
954 #endif /* def FEATURE_STATISTICS */
955
956             return TRUE;
957          }
958       }
959    }
960
961    return FALSE;
962 }
963
964
965 /*********************************************************************
966  *
967  * Function    :  build_request_line
968  *
969  * Description :  Builds the HTTP request line.
970  *
971  *                If a HTTP forwarder is used it expects the whole URL,
972  *                web servers only get the path.
973  *
974  * Parameters  :
975  *          1  :  csp = Current client state (buffers, headers, etc...)
976  *          2  :  fwd = The forwarding spec used for the request
977  *                XXX: Should use http->fwd instead.
978  *          3  :  request_line = The old request line which will be replaced.
979  *
980  * Returns     :  Nothing. Terminates in case of memory problems.
981  *
982  *********************************************************************/
983 static void build_request_line(struct client_state *csp, const struct forward_spec *fwd, char **request_line)
984 {
985    struct http_request *http = csp->http;
986
987    /*
988     * Downgrade http version from 1.1 to 1.0
989     * if +downgrade action applies.
990     */
991    if ((csp->action->flags & ACTION_DOWNGRADE)
992      && (!strcmpic(http->version, "HTTP/1.1")))
993    {
994       freez(http->version);
995       http->version = strdup_or_die("HTTP/1.0");
996    }
997
998    /*
999     * Rebuild the request line.
1000     */
1001    freez(*request_line);
1002    *request_line = strdup(http->gpc);
1003    string_append(request_line, " ");
1004
1005    if (fwd->forward_host && fwd->type != FORWARD_WEBSERVER)
1006    {
1007       string_append(request_line, http->url);
1008    }
1009    else
1010    {
1011       string_append(request_line, http->path);
1012    }
1013    string_append(request_line, " ");
1014    string_append(request_line, http->version);
1015
1016    if (*request_line == NULL)
1017    {
1018       log_error(LOG_LEVEL_FATAL, "Out of memory writing HTTP command");
1019    }
1020    log_error(LOG_LEVEL_HEADER, "New HTTP Request-Line: %s", *request_line);
1021 }
1022
1023
1024 /*********************************************************************
1025  *
1026  * Function    :  change_request_destination
1027  *
1028  * Description :  Parse a (rewritten) request line and regenerate
1029  *                the http request data.
1030  *
1031  * Parameters  :
1032  *          1  :  csp = Current client state (buffers, headers, etc...)
1033  *
1034  * Returns     :  Forwards the parse_http_request() return code.
1035  *                Terminates in case of memory problems.
1036  *
1037  *********************************************************************/
1038 static jb_err change_request_destination(struct client_state *csp)
1039 {
1040    struct http_request *http = csp->http;
1041    jb_err err;
1042
1043    log_error(LOG_LEVEL_REDIRECTS, "Rewrite detected: %s",
1044       csp->headers->first->str);
1045    free_http_request(http);
1046    err = parse_http_request(csp->headers->first->str, http);
1047    if (JB_ERR_OK != err)
1048    {
1049       log_error(LOG_LEVEL_ERROR, "Couldn't parse rewritten request: %s.",
1050          jb_err_to_string(err));
1051    }
1052
1053    return err;
1054 }
1055
1056
1057 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
1058 /*********************************************************************
1059  *
1060  * Function    :  server_response_is_complete
1061  *
1062  * Description :  Determines whether we should stop reading
1063  *                from the server socket.
1064  *
1065  * Parameters  :
1066  *          1  :  csp = Current client state (buffers, headers, etc...)
1067  *          2  :  content_length = Length of content received so far.
1068  *
1069  * Returns     :  TRUE if the response is complete,
1070  *                FALSE otherwise.
1071  *
1072  *********************************************************************/
1073 static int server_response_is_complete(struct client_state *csp,
1074    unsigned long long content_length)
1075 {
1076    int content_length_known = !!(csp->flags & CSP_FLAG_CONTENT_LENGTH_SET);
1077
1078    if (!strcmpic(csp->http->gpc, "HEAD"))
1079    {
1080       /*
1081        * "HEAD" implies no body, we are thus expecting
1082        * no content. XXX: incomplete "list" of methods?
1083        */
1084       csp->expected_content_length = 0;
1085       content_length_known = TRUE;
1086       csp->flags |= CSP_FLAG_SERVER_CONTENT_LENGTH_SET;
1087    }
1088
1089    if (csp->http->status == 204 || csp->http->status == 304)
1090    {
1091       /*
1092        * Expect no body. XXX: incomplete "list" of status codes?
1093        */
1094       csp->expected_content_length = 0;
1095       content_length_known = TRUE;
1096       csp->flags |= CSP_FLAG_SERVER_CONTENT_LENGTH_SET;
1097    }
1098
1099    return (content_length_known && ((0 == csp->expected_content_length)
1100             || (csp->expected_content_length <= content_length)));
1101 }
1102
1103
#ifdef FEATURE_CONNECTION_SHARING
/*********************************************************************
 *
 * Function    :  wait_for_alive_connections
 *
 * Description :  Blocks until close_unusable_connections() reports
 *                that no connections are left alive. The check is
 *                repeated once a minute.
 *
 * Parameters  :  N/A
 *
 * Returns     :  N/A
 *
 *********************************************************************/
static void wait_for_alive_connections(void)
{
   int remaining;

   for (remaining = close_unusable_connections();
        remaining > 0;
        remaining = close_unusable_connections())
   {
      log_error(LOG_LEVEL_CONNECT,
         "Waiting for %d connections to timeout.",
         remaining);
      sleep(60);
   }

   log_error(LOG_LEVEL_CONNECT, "No connections to wait for left.");

}
#endif /* def FEATURE_CONNECTION_SHARING */
1133
1134
1135 /*********************************************************************
1136  *
1137  * Function    :  save_connection_destination
1138  *
1139  * Description :  Remembers a connection for reuse later on.
1140  *
1141  * Parameters  :
1142  *          1  :  sfd  = Open socket to remember.
1143  *          2  :  http = The destination for the connection.
1144  *          3  :  fwd  = The forwarder settings used.
1145  *          4  :  server_connection  = storage.
1146  *
1147  * Returns     : void
1148  *
1149  *********************************************************************/
1150 void save_connection_destination(jb_socket sfd,
1151                                  const struct http_request *http,
1152                                  const struct forward_spec *fwd,
1153                                  struct reusable_connection *server_connection)
1154 {
1155    assert(sfd != JB_INVALID_SOCKET);
1156    assert(NULL != http->host);
1157
1158    server_connection->sfd = sfd;
1159    server_connection->host = strdup_or_die(http->host);
1160    server_connection->port = http->port;
1161
1162    assert(NULL != fwd);
1163    assert(server_connection->gateway_host == NULL);
1164    assert(server_connection->gateway_port == 0);
1165    assert(server_connection->forwarder_type == 0);
1166    assert(server_connection->forward_host == NULL);
1167    assert(server_connection->forward_port == 0);
1168
1169    server_connection->forwarder_type = fwd->type;
1170    if (NULL != fwd->gateway_host)
1171    {
1172       server_connection->gateway_host = strdup_or_die(fwd->gateway_host);
1173    }
1174    else
1175    {
1176       server_connection->gateway_host = NULL;
1177    }
1178    server_connection->gateway_port = fwd->gateway_port;
1179    if (NULL != fwd->auth_username)
1180    {
1181       server_connection->auth_username = strdup_or_die(fwd->auth_username);
1182    }
1183    else
1184    {
1185       server_connection->auth_username = NULL;
1186    }
1187    if (NULL != fwd->auth_password)
1188    {
1189       server_connection->auth_password = strdup_or_die(fwd->auth_password);
1190    }
1191    else
1192    {
1193       server_connection->auth_password = NULL;
1194    }
1195
1196    if (NULL != fwd->forward_host)
1197    {
1198       server_connection->forward_host = strdup_or_die(fwd->forward_host);
1199    }
1200    else
1201    {
1202       server_connection->forward_host = NULL;
1203    }
1204    server_connection->forward_port = fwd->forward_port;
1205 }
1206 #endif /* FEATURE_CONNECTION_KEEP_ALIVE */
1207
1208
1209 /*********************************************************************
1210  *
1211  * Function    : verify_request_length
1212  *
1213  * Description : Checks if we already got the whole client requests
1214  *               and sets CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ if
1215  *               we do.
1216  *
1217  *               Data that doesn't belong to the current request is
1218  *               either thrown away to let the client retry on a clean
1219  *               socket, or stashed to be dealt with after the current
1220  *               request is served.
1221  *
1222  * Parameters  :
1223  *          1  :  csp = Current client state (buffers, headers, etc...)
1224  *
1225  * Returns     :  void
1226  *
1227  *********************************************************************/
1228 static void verify_request_length(struct client_state *csp)
1229 {
1230    unsigned long long buffered_request_bytes =
1231       (unsigned long long)(csp->client_iob->eod - csp->client_iob->cur);
1232
1233    if ((csp->expected_client_content_length != 0)
1234       && (buffered_request_bytes != 0))
1235    {
1236       if (csp->expected_client_content_length >= buffered_request_bytes)
1237       {
1238          csp->expected_client_content_length -= buffered_request_bytes;
1239          log_error(LOG_LEVEL_CONNECT, "Reduced expected bytes to %llu "
1240             "to account for the %llu ones we already got.",
1241             csp->expected_client_content_length, buffered_request_bytes);
1242       }
1243       else
1244       {
1245          assert(csp->client_iob->eod > csp->client_iob->cur + csp->expected_client_content_length);
1246          csp->client_iob->eod = csp->client_iob->cur + csp->expected_client_content_length;
1247          log_error(LOG_LEVEL_CONNECT, "Reducing expected bytes to 0. "
1248             "Marking the server socket tainted after throwing %llu bytes away.",
1249             buffered_request_bytes - csp->expected_client_content_length);
1250          csp->expected_client_content_length = 0;
1251          csp->flags |= CSP_FLAG_SERVER_SOCKET_TAINTED;
1252       }
1253
1254       if (csp->expected_client_content_length == 0)
1255       {
1256          csp->flags |= CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
1257       }
1258    }
1259
1260    if (!(csp->flags & CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ)
1261       && ((csp->client_iob->cur < csp->client_iob->eod)
1262          || (csp->expected_client_content_length != 0)))
1263    {
1264       if (strcmpic(csp->http->gpc, "GET")
1265          && strcmpic(csp->http->gpc, "HEAD")
1266          && strcmpic(csp->http->gpc, "TRACE")
1267          && strcmpic(csp->http->gpc, "OPTIONS")
1268          && strcmpic(csp->http->gpc, "DELETE"))
1269       {
1270          /* XXX: this is an incomplete hack */
1271          csp->flags &= ~CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
1272          log_error(LOG_LEVEL_CONNECT, "There better be a request body.");
1273       }
1274       else
1275       {
1276          csp->flags |= CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
1277
1278          if ((csp->config->feature_flags & RUNTIME_FEATURE_TOLERATE_PIPELINING) == 0)
1279          {
1280             csp->flags |= CSP_FLAG_SERVER_SOCKET_TAINTED;
1281             log_error(LOG_LEVEL_CONNECT,
1282                "Possible pipeline attempt detected. The connection will not "
1283                "be kept alive and we will only serve the first request.");
1284             /* Nuke the pipelined requests from orbit, just to be sure. */
1285             clear_iob(csp->client_iob);
1286          }
1287          else
1288          {
1289             /*
1290              * Keep the pipelined data around for now, we'll deal with
1291              * it once we're done serving the current request.
1292              */
1293             csp->flags |= CSP_FLAG_PIPELINED_REQUEST_WAITING;
1294             assert(csp->client_iob->eod >= csp->client_iob->cur);
1295             log_error(LOG_LEVEL_CONNECT, "Complete client request followed by "
1296                "%d bytes of pipelined data received.",
1297                (int)(csp->client_iob->eod - csp->client_iob->cur));
1298          }
1299       }
1300    }
1301    else
1302    {
1303       csp->flags |= CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
1304       log_error(LOG_LEVEL_CONNECT, "Complete client request received.");
1305    }
1306 }
1307
1308
1309 /*********************************************************************
1310  *
1311  * Function    :  mark_server_socket_tainted
1312  *
1313  * Description :  Makes sure we don't reuse a server socket
1314  *                (if we didn't read everything the server sent
1315  *                us reusing the socket would lead to garbage).
1316  *
1317  * Parameters  :
1318  *          1  :  csp = Current client state (buffers, headers, etc...)
1319  *
1320  * Returns     :  void.
1321  *
1322  *********************************************************************/
1323 static void mark_server_socket_tainted(struct client_state *csp)
1324 {
1325    /*
1326     * For consistency we always mark the server socket
1327     * tainted, however, to reduce the log noise we only
1328     * emit a log message if the server socket could have
1329     * actually been reused.
1330     */
1331    if ((csp->flags & CSP_FLAG_SERVER_CONNECTION_KEEP_ALIVE)
1332       && !(csp->flags & CSP_FLAG_SERVER_SOCKET_TAINTED))
1333    {
1334       log_error(LOG_LEVEL_CONNECT,
1335          "Marking the server socket %d tainted.",
1336          csp->server_connection.sfd);
1337    }
1338    csp->flags |= CSP_FLAG_SERVER_SOCKET_TAINTED;
1339 }
1340
1341 /*********************************************************************
1342  *
1343  * Function    :  get_request_line
1344  *
1345  * Description : Read the client request line.
1346  *
1347  * Parameters  :
1348  *          1  :  csp = Current client state (buffers, headers, etc...)
1349  *
1350  * Returns     :  Pointer to request line or NULL in case of errors.
1351  *
1352  *********************************************************************/
1353 static char *get_request_line(struct client_state *csp)
1354 {
1355    char buf[BUFFER_SIZE];
1356    char *request_line = NULL;
1357    int len;
1358
1359    memset(buf, 0, sizeof(buf));
1360
1361    if ((csp->flags & CSP_FLAG_PIPELINED_REQUEST_WAITING) != 0)
1362    {
1363       /*
1364        * If there are multiple pipelined requests waiting,
1365        * the flag will be set again once the next request
1366        * has been parsed.
1367        */
1368       csp->flags &= ~CSP_FLAG_PIPELINED_REQUEST_WAITING;
1369
1370       request_line = get_header(csp->client_iob);
1371       if ((NULL != request_line) && ('\0' != *request_line))
1372       {
1373          return request_line;
1374       }
1375       else
1376       {
1377          log_error(LOG_LEVEL_CONNECT, "No complete request line "
1378             "received yet. Continuing reading from %d.", csp->cfd);
1379       }
1380    }
1381
1382    do
1383    {
1384       if (
1385 #ifdef FUZZ
1386           0 == (csp->flags & CSP_FLAG_FUZZED_INPUT) &&
1387 #endif
1388           !data_is_available(csp->cfd, csp->config->socket_timeout)
1389           )
1390       {
1391          if (socket_is_still_alive(csp->cfd))
1392          {
1393             log_error(LOG_LEVEL_CONNECT,
1394                "No request line on socket %d received in time. Timeout: %d.",
1395                csp->cfd, csp->config->socket_timeout);
1396             write_socket_delayed(csp->cfd, CLIENT_CONNECTION_TIMEOUT_RESPONSE,
1397                strlen(CLIENT_CONNECTION_TIMEOUT_RESPONSE),
1398                get_write_delay(csp));
1399          }
1400          else
1401          {
1402             log_error(LOG_LEVEL_CONNECT,
1403                "The client side of the connection on socket %d got "
1404                "closed without sending a complete request line.", csp->cfd);
1405          }
1406          return NULL;
1407       }
1408
1409       len = read_socket(csp->cfd, buf, sizeof(buf) - 1);
1410
1411       if (len <= 0) return NULL;
1412
1413       /*
1414        * If there is no memory left for buffering the
1415        * request, there is nothing we can do but hang up
1416        */
1417       if (add_to_iob(csp->client_iob, csp->config->buffer_limit, buf, len))
1418       {
1419          return NULL;
1420       }
1421
1422       request_line = get_header(csp->client_iob);
1423
1424    } while ((NULL != request_line) && ('\0' == *request_line));
1425
1426    return request_line;
1427
1428 }
1429
/*
 * Results of checking whether a chunk-encoded
 * body has been completely buffered.
 */
enum chunk_status
{
   /* More data is required before a decision can be made. */
   CHUNK_STATUS_MISSING_DATA,
   /* The body, including the last chunk, is complete. */
   CHUNK_STATUS_BODY_COMPLETE,
   /* The buffered data isn't valid chunked encoding. */
   CHUNK_STATUS_PARSE_ERROR
};
1436
1437
1438 /*********************************************************************
1439  *
1440  * Function    :  chunked_body_is_complete
1441  *
1442  * Description :  Figures out whether or not a chunked body is complete.
1443  *
1444  *                Currently it always starts at the beginning of the
1445  *                buffer which is somewhat wasteful and prevents Privoxy
1446  *                from starting to forward the correctly parsed chunks
1447  *                as soon as theoretically possible.
1448  *
1449  *                Should be modified to work with a common buffer,
1450  *                and allow the caller to skip already parsed chunks.
1451  *
1452  *                This would allow the function to be used for unbuffered
1453  *                response bodies as well.
1454  *
1455  * Parameters  :
1456  *          1  :  iob = Buffer with the body to check.
1457  *          2  :  length = Length of complete body
1458  *
1459  * Returns     :  Enum with the result of the check.
1460  *
1461  *********************************************************************/
1462 static enum chunk_status chunked_body_is_complete(struct iob *iob, size_t *length)
1463 {
1464    unsigned int chunksize;
1465    char *p = iob->cur;
1466
1467    do
1468    {
1469       /*
1470        * We need at least a single digit, followed by "\r\n",
1471        * followed by an unknown amount of data, followed by "\r\n".
1472        */
1473       if (p + 5 > iob->eod)
1474       {
1475          return CHUNK_STATUS_MISSING_DATA;
1476       }
1477       if (sscanf(p, "%x", &chunksize) != 1)
1478       {
1479          return CHUNK_STATUS_PARSE_ERROR;
1480       }
1481
1482       /*
1483        * We want at least a single digit, followed by "\r\n",
1484        * followed by the specified amount of data, followed by "\r\n".
1485        */
1486       if (p + chunksize + 5 > iob->eod)
1487       {
1488          return CHUNK_STATUS_MISSING_DATA;
1489       }
1490
1491       /* Skip chunk-size. */
1492       p = strstr(p, "\r\n");
1493       if (NULL == p)
1494       {
1495          return CHUNK_STATUS_PARSE_ERROR;
1496       }
1497       /* Move beyond the chunkdata. */
1498       p += 2 + chunksize;
1499
1500       /* There should be another "\r\n" to skip */
1501       if (memcmp(p, "\r\n", 2))
1502       {
1503          return CHUNK_STATUS_PARSE_ERROR;
1504       }
1505       p += 2;
1506    } while (chunksize > 0U);
1507
1508    *length = (size_t)(p - iob->cur);
1509    assert(*length <= (size_t)(iob->eod - iob->cur));
1510    assert(p <= iob->eod);
1511
1512    return CHUNK_STATUS_BODY_COMPLETE;
1513
1514 }
1515
1516
1517 /*********************************************************************
1518  *
1519  * Function    : receive_chunked_client_request_body
1520  *
1521  * Description : Read the chunk-encoded client request body.
1522  *               Failures are dealt with.
1523  *
1524  * Parameters  :
1525  *          1  :  csp = Current client state (buffers, headers, etc...)
1526  *
1527  * Returns     :  JB_ERR_OK or JB_ERR_PARSE
1528  *
1529  *********************************************************************/
1530 static jb_err receive_chunked_client_request_body(struct client_state *csp)
1531 {
1532    size_t body_length;
1533    enum chunk_status status;
1534
1535    while (CHUNK_STATUS_MISSING_DATA ==
1536       (status = chunked_body_is_complete(csp->client_iob, &body_length)))
1537    {
1538       char buf[BUFFER_SIZE];
1539       int len;
1540
1541       if (!data_is_available(csp->cfd, csp->config->socket_timeout))
1542       {
1543          log_error(LOG_LEVEL_ERROR,
1544             "Timeout while waiting for the client body.");
1545          break;
1546       }
1547       len = read_socket(csp->cfd, buf, sizeof(buf) - 1);
1548       if (len <= 0)
1549       {
1550          log_error(LOG_LEVEL_ERROR, "Read the client body failed: %E");
1551          break;
1552       }
1553       if (add_to_iob(csp->client_iob, csp->config->buffer_limit, buf, len))
1554       {
1555          break;
1556       }
1557    }
1558    if (status != CHUNK_STATUS_BODY_COMPLETE)
1559    {
1560       write_socket_delayed(csp->cfd, CLIENT_BODY_PARSE_ERROR_RESPONSE,
1561          strlen(CLIENT_BODY_PARSE_ERROR_RESPONSE), get_write_delay(csp));
1562       log_error(LOG_LEVEL_CLF,
1563          "%s - - [%T] \"Failed reading chunked client body\" 400 0", csp->ip_addr_str);
1564       return JB_ERR_PARSE;
1565    }
1566    log_error(LOG_LEVEL_CONNECT,
1567       "Chunked client body completely read. Length: %lu", body_length);
1568    csp->expected_client_content_length = body_length;
1569
1570    return JB_ERR_OK;
1571
1572 }
1573
1574
1575 #ifdef FUZZ
1576 /*********************************************************************
1577  *
1578  * Function    :  fuzz_chunked_transfer_encoding
1579  *
1580  * Description :  Treat the fuzzed input as chunked transfer encoding
1581  *                to check and dechunk.
1582  *
1583  * Parameters  :
1584  *          1  :  csp      = Used to store the data.
1585  *          2  :  fuzz_input_file = File to read the input from.
1586  *
1587  * Returns     : Result of dechunking
1588  *
1589  *********************************************************************/
1590 extern int fuzz_chunked_transfer_encoding(struct client_state *csp, char *fuzz_input_file)
1591 {
1592    size_t length;
1593    size_t size = (size_t)(csp->iob->eod - csp->iob->cur);
1594    enum chunk_status status;
1595
1596    status = chunked_body_is_complete(csp->iob, &length);
1597    if (CHUNK_STATUS_BODY_COMPLETE != status)
1598    {
1599       log_error(LOG_LEVEL_INFO, "Chunked body is incomplete or invalid");
1600    }
1601
1602    return (JB_ERR_OK == remove_chunked_transfer_coding(csp->iob->cur, &size));
1603
1604 }
1605
1606
1607 /*********************************************************************
1608  *
1609  * Function    : fuzz_client_request
1610  *
1611  * Description : Try to get a client request from the fuzzed input.
1612  *
1613  * Parameters  :
1614  *          1  :  csp = Current client state (buffers, headers, etc...)
1615  *          2  :  fuzz_input_file = File to read the input from.
1616  *
1617  * Returns     :  Result of fuzzing.
1618  *
1619  *********************************************************************/
1620 extern int fuzz_client_request(struct client_state *csp, char *fuzz_input_file)
1621 {
1622    jb_err err;
1623
1624    csp->cfd = 0;
1625    csp->ip_addr_str = "fuzzer";
1626
1627    if (strcmp(fuzz_input_file, "-") != 0)
1628    {
1629       log_error(LOG_LEVEL_FATAL,
1630          "Fuzzed client requests can currently only be read from stdin (-).");
1631    }
1632    err = receive_client_request(csp);
1633    if (err != JB_ERR_OK)
1634    {
1635       return 1;
1636    }
1637    err = parse_client_request(csp);
1638    if (err != JB_ERR_OK)
1639    {
1640       return 1;
1641    }
1642
1643    return 0;
1644
1645 }
1646 #endif  /* def FUZZ */
1647
1648
#ifdef FEATURE_FORCE_LOAD
/*********************************************************************
 *
 * Function    :  force_required
 *
 * Description : Checks whether the path in a request line starts
 *               with the FORCE_PREFIX. If it does, the prefix is
 *               removed from the request line, unless enforcing
 *               blocks has been enabled in which case the prefix
 *               is ignored.
 *
 * Parameters  :
 *          1  :  csp = Current client state (buffers, headers, etc...)
 *          2  :  request_line = HTTP request line
 *
 * Returns     :  TRUE if force is required, FALSE otherwise.
 *
 *********************************************************************/
static int force_required(const struct client_state *csp, char *request_line)
{
   char *scheme = strstr(request_line, "http://");
   char *path;

   /*
    * The path is searched for behind the protocol. Intercepted
    * requests usually don't specify one, in which case the search
    * starts at the beginning of the request line.
    */
   path = strchr((scheme != NULL) ? scheme + strlen("http://") : request_line, '/');
   if (NULL == path)
   {
      /*
       * Without a path the request line is invalid. Rejecting
       * it in a way that is visible to the client is left to
       * the code that deals with the request later on.
       */
      return 0;
   }

   if (0 != strncmpic(path, FORCE_PREFIX, strlen(FORCE_PREFIX) - 1))
   {
      /* No force prefix, no force. */
      return 0;
   }

   if (csp->config->feature_flags & RUNTIME_FEATURE_ENFORCE_BLOCKS)
   {
      log_error(LOG_LEVEL_FORCE,
         "Ignored force prefix in request: \"%s\".", request_line);
      return 0;
   }

   /* XXX: Should clean more carefully */
   strclean(request_line, FORCE_PREFIX);
   log_error(LOG_LEVEL_FORCE,
      "Enforcing request: \"%s\".", request_line);

   return 1;

}
#endif /* def FEATURE_FORCE_LOAD */
1710
1711
1712 /*********************************************************************
1713  *
1714  * Function    :  receive_client_request
1715  *
1716  * Description : Read the client's request (more precisely the
1717  *               client headers) and answer it if necessary.
1718  *
1719  * Parameters  :
1720  *          1  :  csp = Current client state (buffers, headers, etc...)
1721  *
1722  * Returns     :  JB_ERR_OK, JB_ERR_PARSE or JB_ERR_MEMORY
1723  *
1724  *********************************************************************/
1725 static jb_err receive_client_request(struct client_state *csp)
1726 {
1727    char buf[BUFFER_SIZE];
1728    char *p;
1729    char *req = NULL;
1730    struct http_request *http;
1731    int len;
1732    jb_err err;
1733
1734    /* Temporary copy of the client's headers before they get enlisted in csp->headers */
1735    struct list header_list;
1736    struct list *headers = &header_list;
1737
1738    /* We don't care if the arriving data is a valid HTTP request or not. */
1739    csp->requests_received_total++;
1740
1741    http = csp->http;
1742
1743    memset(buf, 0, sizeof(buf));
1744
1745    req = get_request_line(csp);
1746    if (req == NULL)
1747    {
1748       mark_server_socket_tainted(csp);
1749       return JB_ERR_PARSE;
1750    }
1751    assert(*req != '\0');
1752
1753    if (client_protocol_is_unsupported(csp, req))
1754    {
1755       return JB_ERR_PARSE;
1756    }
1757
1758 #ifdef FEATURE_FORCE_LOAD
1759    if (force_required(csp, req))
1760    {
1761       csp->flags |= CSP_FLAG_FORCED;
1762    }
1763 #endif /* def FEATURE_FORCE_LOAD */
1764
1765    err = parse_http_request(req, http);
1766    freez(req);
1767    if (JB_ERR_OK != err)
1768    {
1769       write_socket_delayed(csp->cfd, CHEADER, strlen(CHEADER),
1770          get_write_delay(csp));
1771       /* XXX: Use correct size */
1772       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"Invalid request\" 400 0", csp->ip_addr_str);
1773       log_error(LOG_LEVEL_ERROR,
1774          "Couldn't parse request line received from %s: %s",
1775          csp->ip_addr_str, jb_err_to_string(err));
1776
1777       free_http_request(http);
1778       return JB_ERR_PARSE;
1779    }
1780
1781    /* grab the rest of the client's headers */
1782    init_list(headers);
1783    for (;;)
1784    {
1785       p = get_header(csp->client_iob);
1786
1787       if (p == NULL)
1788       {
1789          /* There are no additional headers to read. */
1790          break;
1791       }
1792
1793       if (*p == '\0')
1794       {
1795          /*
1796           * We didn't receive a complete header
1797           * line yet, get the rest of it.
1798           */
1799          if (!data_is_available(csp->cfd, csp->config->socket_timeout))
1800          {
1801             log_error(LOG_LEVEL_ERROR,
1802                "Stopped grabbing the client headers.");
1803             destroy_list(headers);
1804             return JB_ERR_PARSE;
1805          }
1806
1807          len = read_socket(csp->cfd, buf, sizeof(buf) - 1);
1808          if (len <= 0)
1809          {
1810             log_error(LOG_LEVEL_ERROR, "read from client failed: %E");
1811             destroy_list(headers);
1812             return JB_ERR_PARSE;
1813          }
1814
1815          if (add_to_iob(csp->client_iob, csp->config->buffer_limit, buf, len))
1816          {
1817             /*
1818              * If there is no memory left for buffering the
1819              * request, there is nothing we can do but hang up
1820              */
1821             destroy_list(headers);
1822             return JB_ERR_MEMORY;
1823          }
1824       }
1825       else
1826       {
1827          if (!strncmpic(p, "Transfer-Encoding:", 18))
1828          {
1829             /*
1830              * XXX: should be called through sed()
1831              *      but currently can't.
1832              */
1833             client_transfer_encoding(csp, &p);
1834          }
1835          /*
1836           * We were able to read a complete
1837           * header and can finally enlist it.
1838           */
1839          enlist(headers, p);
1840          freez(p);
1841       }
1842    }
1843
1844    if (http->host == NULL)
1845    {
1846       /*
1847        * If we still don't know the request destination,
1848        * the request is invalid or the client uses
1849        * Privoxy without its knowledge.
1850        */
1851       if (JB_ERR_OK != get_request_destination_elsewhere(csp, headers))
1852       {
1853          /*
1854           * Our attempts to get the request destination
1855           * elsewhere failed or Privoxy is configured
1856           * to only accept proxy requests.
1857           *
1858           * An error response has already been send
1859           * and we're done here.
1860           */
1861          return JB_ERR_PARSE;
1862       }
1863    }
1864
1865 #ifdef FEATURE_CLIENT_TAGS
1866    /* XXX: If the headers were enlisted sooner, passing csp would do. */
1867    set_client_address(csp, headers);
1868    get_tag_list_for_client(csp->client_tags, csp->client_address);
1869 #endif
1870
1871    /*
1872     * Determine the actions for this URL
1873     */
1874 #ifdef FEATURE_TOGGLE
1875    if (!(csp->flags & CSP_FLAG_TOGGLED_ON))
1876    {
1877       /* Most compatible set of actions (i.e. none) */
1878       init_current_action(csp->action);
1879    }
1880    else
1881 #endif /* ndef FEATURE_TOGGLE */
1882    {
1883       get_url_actions(csp, http);
1884    }
1885
1886    enlist(csp->headers, http->cmd);
1887
1888    /* Append the previously read headers */
1889    err = list_append_list_unique(csp->headers, headers);
1890    destroy_list(headers);
1891
1892    return err;
1893
1894 }
1895
1896
1897 /*********************************************************************
1898  *
1899  * Function    : parse_client_request
1900  *
1901  * Description : Parses the client's request and decides what to do
1902  *               with it.
1903  *
1904  *               Note that since we're not using select() we could get
1905  *               blocked here if a client connected, then didn't say
1906  *               anything!
1907  *
1908  * Parameters  :
1909  *          1  :  csp = Current client state (buffers, headers, etc...)
1910  *
1911  * Returns     :  JB_ERR_OK or JB_ERR_PARSE
1912  *
1913  *********************************************************************/
1914 static jb_err parse_client_request(struct client_state *csp)
1915 {
1916    struct http_request *http = csp->http;
1917    jb_err err;
1918
1919 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
1920    if ((csp->config->feature_flags & RUNTIME_FEATURE_CONNECTION_KEEP_ALIVE)
1921     && (!strcmpic(csp->http->version, "HTTP/1.1"))
1922     && (csp->http->ssl == 0))
1923    {
1924       /* Assume persistence until further notice */
1925       csp->flags |= CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
1926    }
1927 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
1928
1929    if (csp->http->ssl == 0)
1930    {
1931       /*
1932        * This whole block belongs to chat() but currently
1933        * has to be executed before sed().
1934        */
1935       if (csp->flags & CSP_FLAG_CHUNKED_CLIENT_BODY)
1936       {
1937          if (receive_chunked_client_request_body(csp) != JB_ERR_OK)
1938          {
1939             return JB_ERR_PARSE;
1940          }
1941       }
1942       else
1943       {
1944          csp->expected_client_content_length = get_expected_content_length(csp->headers);
1945       }
1946       verify_request_length(csp);
1947    }
1948 #ifndef FEATURE_HTTPS_INSPECTION
1949    else
1950    {
1951       csp->flags |= CSP_FLAG_SERVER_SOCKET_TAINTED;
1952    }
1953 #endif
1954
1955    err = sed(csp, FILTER_CLIENT_HEADERS);
1956    if (JB_ERR_OK != err)
1957    {
1958       log_error(LOG_LEVEL_ERROR, "Failed to parse client request from %s.",
1959          csp->ip_addr_str);
1960       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 400 0",
1961          csp->ip_addr_str, csp->http->cmd);
1962       write_socket_delayed(csp->cfd, CHEADER, strlen(CHEADER), get_write_delay(csp));
1963       return JB_ERR_PARSE;
1964    }
1965    csp->flags |= CSP_FLAG_CLIENT_HEADER_PARSING_DONE;
1966
1967    /* Check request line for rewrites. */
1968    if ((NULL == csp->headers->first->str)
1969       || (strcmp(http->cmd, csp->headers->first->str) &&
1970          (JB_ERR_OK != change_request_destination(csp))))
1971    {
1972       /*
1973        * A header filter broke the request line - bail out.
1974        */
1975       write_socket_delayed(csp->cfd, MESSED_UP_REQUEST_RESPONSE,
1976          strlen(MESSED_UP_REQUEST_RESPONSE), get_write_delay(csp));
1977       /* XXX: Use correct size */
1978       log_error(LOG_LEVEL_CLF,
1979          "%s - - [%T] \"Invalid request generated\" 500 0", csp->ip_addr_str);
1980       log_error(LOG_LEVEL_ERROR,
1981          "Invalid request line after applying header filters.");
1982       free_http_request(http);
1983
1984       return JB_ERR_PARSE;
1985    }
1986
1987    if (client_has_unsupported_expectations(csp))
1988    {
1989       return JB_ERR_PARSE;
1990    }
1991
1992    return JB_ERR_OK;
1993
1994 }
1995
1996
1997 /*********************************************************************
1998  *
1999  * Function    : send_http_request
2000  *
2001  * Description : Sends the HTTP headers from the client request
2002  *               and all the body data that has already been received.
2003  *
2004  * Parameters  :
2005  *          1  :  csp = Current client state (buffers, headers, etc...)
2006  *
2007  * Returns     :  0 on success, anything else is an error.
2008  *
2009  *********************************************************************/
2010 static int send_http_request(struct client_state *csp)
2011 {
2012    char *hdr;
2013    int write_failure;
2014
2015    hdr = list_to_text(csp->headers);
2016    if (hdr == NULL)
2017    {
2018       /* FIXME Should handle error properly */
2019       log_error(LOG_LEVEL_FATAL, "Out of memory parsing client header");
2020    }
2021    list_remove_all(csp->headers);
2022
2023    /*
2024     * Write the client's (modified) header to the server
2025     * (along with anything else that may be in the buffer)
2026     */
2027    write_failure = 0 != write_socket(csp->server_connection.sfd, hdr, strlen(hdr));
2028    freez(hdr);
2029
2030    if (write_failure)
2031    {
2032       log_error(LOG_LEVEL_CONNECT, "Failed sending request headers to: %s: %E",
2033          csp->http->hostport);
2034    }
2035    else if (((csp->flags & CSP_FLAG_PIPELINED_REQUEST_WAITING) == 0)
2036       && (flush_iob(csp->server_connection.sfd, csp->client_iob, 0) < 0))
2037    {
2038       write_failure = 1;
2039       log_error(LOG_LEVEL_CONNECT, "Failed sending request body to: %s: %E",
2040          csp->http->hostport);
2041    }
2042
2043    return write_failure;
2044
2045 }
2046
2047
2048 #ifdef FEATURE_HTTPS_INSPECTION
2049 /*********************************************************************
2050  *
2051  * Function    : receive_and_send_encrypted_post_data
2052  *
2053  * Description : Reads remaining POST data from the client and sends
2054  *               it to the server.
2055  *
2056  * Parameters  :
2057  *          1  :  csp = Current client state (buffers, headers, etc...)
2058  *
2059  * Returns     :  0 on success, anything else is an error.
2060  *
2061  *********************************************************************/
2062 static int receive_and_send_encrypted_post_data(struct client_state *csp)
2063 {
2064    int content_length_known = csp->expected_client_content_length != 0;
2065
2066    while (is_ssl_pending(&(csp->ssl_client_attr))
2067       || (content_length_known && csp->expected_client_content_length != 0))
2068    {
2069       unsigned char buf[BUFFER_SIZE];
2070       int len;
2071       int max_bytes_to_read = sizeof(buf);
2072
2073       if (content_length_known && csp->expected_client_content_length < sizeof(buf))
2074       {
2075          max_bytes_to_read = (int)csp->expected_client_content_length;
2076       }
2077       log_error(LOG_LEVEL_CONNECT,
2078          "Waiting for up to %d bytes of POST data from the client.",
2079          max_bytes_to_read);
2080       len = ssl_recv_data(&(csp->ssl_client_attr), buf,
2081          (unsigned)max_bytes_to_read);
2082       if (len == -1)
2083       {
2084          return 1;
2085       }
2086       if (len == 0)
2087       {
2088          /* XXX: Does this actually happen? */
2089          break;
2090       }
2091       log_error(LOG_LEVEL_CONNECT, "Forwarding %d bytes of encrypted POST data",
2092          len);
2093       len = ssl_send_data(&(csp->ssl_server_attr), buf, (size_t)len);
2094       if (len == -1)
2095       {
2096          return 1;
2097       }
2098       if (csp->expected_client_content_length != 0)
2099       {
2100          if (csp->expected_client_content_length >= len)
2101          {
2102             csp->expected_client_content_length -= (unsigned)len;
2103          }
2104          if (csp->expected_client_content_length == 0)
2105          {
2106             log_error(LOG_LEVEL_CONNECT, "Forwarded the last %d bytes", len);
2107             break;
2108          }
2109       }
2110    }
2111
2112    log_error(LOG_LEVEL_CONNECT, "Done forwarding encrypted POST data");
2113
2114    return 0;
2115
2116 }
2117
2118
2119 /*********************************************************************
2120  *
2121  * Function    : send_https_request
2122  *
2123  * Description : Sends the HTTP headers from the client request
2124  *               and all the body data that has already been received.
2125  *
2126  * Parameters  :
2127  *          1  :  csp = Current client state (buffers, headers, etc...)
2128  *
2129  * Returns     :  0 on success, anything else is an error.
2130  *
2131  *********************************************************************/
2132 static int send_https_request(struct client_state *csp)
2133 {
2134    char *hdr;
2135    int ret;
2136    long flushed = 0;
2137
2138    hdr = list_to_text(csp->https_headers);
2139    if (hdr == NULL)
2140    {
2141       /* FIXME Should handle error properly */
2142       log_error(LOG_LEVEL_FATAL, "Out of memory parsing client header");
2143    }
2144    list_remove_all(csp->https_headers);
2145
2146    /*
2147     * Write the client's (modified) header to the server
2148     * (along with anything else that may be in the buffer)
2149     */
2150    ret = ssl_send_data(&(csp->ssl_server_attr),
2151       (const unsigned char *)hdr, strlen(hdr));
2152    freez(hdr);
2153
2154    if (ret < 0)
2155    {
2156       log_error(LOG_LEVEL_CONNECT,
2157          "Failed sending encrypted request headers to: %s: %E",
2158          csp->http->hostport);
2159       mark_server_socket_tainted(csp);
2160       return 1;
2161    }
2162
2163    if (((csp->flags & CSP_FLAG_PIPELINED_REQUEST_WAITING) == 0)
2164       && ((flushed = ssl_flush_socket(&(csp->ssl_server_attr),
2165             csp->client_iob)) < 0))
2166    {
2167       log_error(LOG_LEVEL_CONNECT, "Failed sending request body to: %s: %E",
2168          csp->http->hostport);
2169       return 1;
2170    }
2171    if (flushed != 0 || csp->expected_client_content_length != 0)
2172    {
2173       if (csp->expected_client_content_length != 0)
2174       {
2175          if (csp->expected_client_content_length < flushed)
2176          {
2177             log_error(LOG_LEVEL_ERROR,
2178                "Flushed %ld bytes of request body while only expecting %llu",
2179                flushed, csp->expected_client_content_length);
2180             csp->expected_client_content_length = 0;
2181          }
2182          else
2183          {
2184             log_error(LOG_LEVEL_CONNECT,
2185                "Flushed %ld bytes of request body while expecting %llu",
2186                flushed, csp->expected_client_content_length);
2187             csp->expected_client_content_length -= (unsigned)flushed;
2188             if (receive_and_send_encrypted_post_data(csp))
2189             {
2190                return 1;
2191             }
2192          }
2193       }
2194       else
2195       {
2196          log_error(LOG_LEVEL_CONNECT,
2197             "Flushed %ld bytes of request body", flushed);
2198       }
2199    }
2200
2201    log_error(LOG_LEVEL_CONNECT, "Encrypted request sent");
2202
2203    return 0;
2204
2205 }
2206
2207
2208 /*********************************************************************
2209  *
2210  * Function    :  receive_encrypted_request
2211  *
2212  * Description :  Receives an encrypted request.
2213  *
2214  * Parameters  :
2215  *          1  :  csp = Current client state (buffers, headers, etc...)
2216  *
2217  * Returns     :  JB_ERR_OK on success,
2218  *                JB_ERR_PARSE or JB_ERR_MEMORY otherwise
2219  *
2220  *********************************************************************/
2221 static jb_err receive_encrypted_request(struct client_state *csp)
2222 {
2223    char buf[BUFFER_SIZE];
2224    int len;
2225    char *p;
2226
2227    do
2228    {
2229       log_error(LOG_LEVEL_HEADER, "Reading encrypted headers");
2230       if (!is_ssl_pending(&(csp->ssl_client_attr)) &&
2231           !data_is_available(csp->cfd, csp->config->socket_timeout))
2232       {
2233          log_error(LOG_LEVEL_CONNECT,
2234             "Socket %d timed out while waiting for client headers", csp->cfd);
2235          return JB_ERR_PARSE;
2236       }
2237       len = ssl_recv_data(&(csp->ssl_client_attr),
2238          (unsigned char *)buf, sizeof(buf));
2239       if (len == 0)
2240       {
2241          log_error(LOG_LEVEL_CONNECT,
2242             "Socket %d closed while waiting for client headers", csp->cfd);
2243          return JB_ERR_PARSE;
2244       }
2245       if (len == -1)
2246       {
2247          return JB_ERR_PARSE;
2248       }
2249       if (add_to_iob(csp->client_iob, csp->config->buffer_limit, buf, len))
2250       {
2251          return JB_ERR_MEMORY;
2252       }
2253       p = strstr(csp->client_iob->cur, "\r\n\r\n");
2254    } while (p == NULL);
2255
2256    log_error(LOG_LEVEL_HEADER, "Encrypted headers received completely");
2257
2258    return JB_ERR_OK;
2259 }
2260
2261
2262 /*********************************************************************
2263  *
2264  * Function    :  process_encrypted_request
2265  *
2266  * Description :  Receives and parses an encrypted request.
2267  *
2268  * Parameters  :
2269  *          1  :  csp = Current client state (buffers, headers, etc...)
2270  *
2271  * Returns     :  JB_ERR_OK on success,
2272  *                JB_ERR_PARSE or JB_ERR_MEMORY otherwise
2273  *
2274  *********************************************************************/
2275 static jb_err process_encrypted_request(struct client_state *csp)
2276 {
2277    char *p;
2278    char *request_line;
2279    jb_err err;
2280    /* Temporary copy of the client's headers before they get enlisted in csp->https_headers */
2281    struct list header_list;
2282    struct list *headers = &header_list;
2283
2284    assert(csp->ssl_with_client_is_opened);
2285
2286 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2287    if (csp->config->feature_flags & RUNTIME_FEATURE_CONNECTION_KEEP_ALIVE)
2288    {
2289       csp->flags |= CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
2290    }
2291 #endif
2292    err = receive_encrypted_request(csp);
2293    if (err != JB_ERR_OK)
2294    {
2295       if (csp->client_iob->cur == NULL ||
2296           csp->client_iob->cur == csp->client_iob->eod)
2297       {
2298          /*
2299           * We did not receive any data, most likely because the
2300           * client is done. Don't log this as a parse failure.
2301           */
2302          return JB_ERR_PARSE;
2303       }
2304       /* XXX: Also used for JB_ERR_MEMORY */
2305       log_error(LOG_LEVEL_ERROR, "Failed to receive encrypted request: %s",
2306          jb_err_to_string(err));
2307       ssl_send_data_delayed(&(csp->ssl_client_attr),
2308          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2309       return err;
2310    }
2311
2312    /* We don't need get_request_line() because the whole HTTP head is buffered. */
2313    request_line = get_header(csp->client_iob);
2314    if (request_line == NULL)
2315    {
2316       log_error(LOG_LEVEL_ERROR, "Failed to get the encrypted request line");
2317       ssl_send_data_delayed(&(csp->ssl_client_attr),
2318          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2319       return JB_ERR_PARSE;
2320    }
2321    assert(*request_line != '\0');
2322
2323    if (client_protocol_is_unsupported(csp, request_line))
2324    {
2325       /*
2326        * If the protocol is unsupported we're done here.
2327        * client_protocol_is_unsupported() took care of sending
2328        * the error response and logging the error message.
2329        */
2330       return JB_ERR_PARSE;
2331    }
2332
2333 #ifdef FEATURE_FORCE_LOAD
2334    if (force_required(csp, request_line))
2335    {
2336       csp->flags |= CSP_FLAG_FORCED;
2337    }
2338 #endif /* def FEATURE_FORCE_LOAD */
2339
2340    free_http_request(csp->http);
2341
2342    err = parse_http_request(request_line, csp->http);
2343    /* XXX: Restore ssl setting. This is ugly */
2344    csp->http->client_ssl = 1;
2345    csp->http->server_ssl = 1;
2346
2347    freez(request_line);
2348    if (JB_ERR_OK != err)
2349    {
2350       ssl_send_data_delayed(&(csp->ssl_client_attr),
2351          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2352       /* XXX: Use correct size */
2353       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"Invalid request\" 400 0", csp->ip_addr_str);
2354       log_error(LOG_LEVEL_ERROR,
2355          "Couldn't parse request line received from %s: %s",
2356          csp->ip_addr_str, jb_err_to_string(err));
2357
2358       free_http_request(csp->http);
2359       return JB_ERR_PARSE;
2360    }
2361
2362    /* Parse the rest of the client's headers. */
2363    init_list(headers);
2364    for (;;)
2365    {
2366       p = get_header(csp->client_iob);
2367
2368       if (p == NULL)
2369       {
2370          /* There are no additional headers to read. */
2371          break;
2372       }
2373       enlist(headers, p);
2374       freez(p);
2375    }
2376
2377    if (JB_ERR_OK != get_destination_from_https_headers(headers, csp->http))
2378    {
2379       /*
2380        * Our attempts to get the request destination
2381        * elsewhere failed.
2382        */
2383       log_error(LOG_LEVEL_ERROR,
2384          "Failed to get the encrypted request destination");
2385       ssl_send_data_delayed(&(csp->ssl_client_attr),
2386          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2387       return JB_ERR_PARSE;
2388    }
2389
2390    /* Split the domain we just got for pattern matching */
2391    init_domain_components(csp->http);
2392
2393 #ifdef FEATURE_CLIENT_TAGS
2394    /* XXX: If the headers were enlisted sooner, passing csp would do. */
2395    if (csp->client_address == NULL)
2396    {
2397       set_client_address(csp, headers);
2398       get_tag_list_for_client(csp->client_tags, csp->client_address);
2399    }
2400 #endif
2401
2402 #ifdef FEATURE_TOGGLE
2403    if ((csp->flags & CSP_FLAG_TOGGLED_ON) != 0)
2404 #endif
2405    {
2406       /*
2407        * Determine the actions for this request after
2408        * clearing the ones from the previous one.
2409        */
2410       free_current_action(csp->action);
2411       get_url_actions(csp, csp->http);
2412    }
2413
2414    enlist(csp->https_headers, csp->http->cmd);
2415
2416    /* Append the previously read headers */
2417    err = list_append_list_unique(csp->https_headers, headers);
2418    destroy_list(headers);
2419    if (JB_ERR_OK != err)
2420    {
2421       /* XXX: Send error message */
2422       return err;
2423    }
2424
2425    /* XXX: Work around crash */
2426    csp->error_message = NULL;
2427
2428    /* XXX: Why do this here? */
2429    csp->http->ssl = 1;
2430
2431    err = sed_https(csp);
2432    if (JB_ERR_OK != err)
2433    {
2434       ssl_send_data_delayed(&(csp->ssl_client_attr),
2435          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2436       log_error(LOG_LEVEL_ERROR, "Failed to parse client request from %s.",
2437          csp->ip_addr_str);
2438       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 400 0",
2439          csp->ip_addr_str, csp->http->cmd);
2440       return JB_ERR_PARSE;
2441    }
2442
2443    log_error(LOG_LEVEL_HEADER, "Encrypted request processed");
2444    log_applied_actions(csp->action);
2445    log_error(LOG_LEVEL_REQUEST, "https://%s%s", csp->http->hostport,
2446       csp->http->path);
2447
2448    return err;
2449
2450 }
2451
2452 /*********************************************************************
2453  *
2454  * Function    :  cgi_page_requested
2455  *
2456  * Description :  Checks if a request is for an internal CGI page.
2457  *
2458  * Parameters  :
2459  *          1  :  host = The host requested by the client.
2460  *
2461  * Returns     :  1 if a CGI page has been requested, 0 otherwise
2462  *
2463  *********************************************************************/
2464 static int cgi_page_requested(const char *host)
2465 {
2466    if ((0 == strcmpic(host, CGI_SITE_1_HOST))
2467     || (0 == strcmpic(host, CGI_SITE_1_HOST "."))
2468     || (0 == strcmpic(host, CGI_SITE_2_HOST))
2469     || (0 == strcmpic(host, CGI_SITE_2_HOST ".")))
2470    {
2471       return 1;
2472    }
2473
2474    return 0;
2475
2476 }
2477
2478
2479 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2480 /*********************************************************************
2481  *
2482  * Function    :  continue_https_chat
2483  *
2484  * Description :  Behaves similar to chat() but only deals with
2485  *                https-inspected requests that arrive on an already
2486  *                established connection. The first request is always
2487  *                served by chat() which is a lot more complex as it
2488  *                has to deal with forwarding settings and connection
2489  *                failures etc.
2490  *
2491  *                If a connection to the server has already been
2492  *                opened it is reused unless the request is blocked
2493  *                or the forwarder changed.
2494  *
2495  *                If a connection to the server has not yet been
2496  *                opened (because the previous request was crunched),
2497  *                or the forwarder changed, the connection is dropped
2498  *                so that the client retries on a fresh one.
2499  *
2500  * Parameters  :
2501  *          1  :  csp = Current client state (buffers, headers, etc...)
2502  *
2503  * Returns     :  Nothing.
2504  *
2505  *********************************************************************/
2506 static void continue_https_chat(struct client_state *csp)
2507 {
2508    const struct forward_spec *fwd;
2509
2510    if (JB_ERR_OK != process_encrypted_request(csp))
2511    {
2512       return;
2513    }
2514
2515    csp->requests_received_total++;
2516
2517    /*
2518     * We have an encrypted request. Check if one of the crunchers wants it.
2519     */
2520    if (crunch_response_triggered(csp, crunchers_all))
2521    {
2522       /*
2523        * Yes. The client got the crunch response and we're done here.
2524        */
2525       return;
2526    }
2527    if (csp->ssl_with_server_is_opened == 0)
2528    {
2529       log_error(LOG_LEVEL_CONNECT,
2530          "Dropping the client connection on socket %d. "
2531          "The server connection has not been established yet.",
2532          csp->cfd);
2533       csp->flags &= ~CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
2534       return;
2535    }
2536    assert(csp->server_connection.sfd != JB_INVALID_SOCKET);
2537
2538    fwd = forward_url(csp, csp->http);
2539    if (!connection_destination_matches(&csp->server_connection, csp->http, fwd))
2540    {
2541       log_error(LOG_LEVEL_CONNECT,
2542          "Dropping the client connection on socket %d with "
2543          "server socket %d connected to %s. The forwarder has changed.",
2544          csp->cfd, csp->server_connection.sfd, csp->server_connection.host);
2545       csp->flags &= ~CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
2546       return;
2547    }
2548
2549    log_error(LOG_LEVEL_CONNECT,
2550       "Reusing server socket %d connected to %s. Requests already sent: %u.",
2551       csp->server_connection.sfd, csp->server_connection.host,
2552       csp->server_connection.requests_sent_total);
2553
2554    if (send_https_request(csp))
2555    {
2556       /*
2557        * Most likely the server connection timed out. We can't easily
2558        * create a new one so simply drop the client connection without a
2559        * error response to let the client retry.
2560        */
2561       log_error(LOG_LEVEL_CONNECT,
2562          "Dropping client connection on socket %d. "
2563          "Forwarding the encrypted client request failed.",
2564          csp->cfd);
2565       return;
2566    }
2567    csp->server_connection.requests_sent_total++;
2568    handle_established_connection(csp);
2569    freez(csp->receive_buffer);
2570 }
2571 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
2572 #endif
2573
2574
2575 /*********************************************************************
2576  *
2577  * Function    :  handle_established_connection
2578  *
2579  * Description :  Shuffle data between client and server once the
2580  *                connection has been established.
2581  *
2582  * Parameters  :
2583  *          1  :  csp = Current client state (buffers, headers, etc...)
2584  *
2585  * Returns     :  Nothing.
2586  *
2587  *********************************************************************/
2588 static void handle_established_connection(struct client_state *csp)
2589 {
2590    char *hdr;
2591    char *p;
2592    int n;
2593 #ifdef HAVE_POLL
2594    struct pollfd poll_fds[2];
2595 #else
2596    fd_set rfds;
2597    jb_socket maxfd;
2598    struct timeval timeout;
2599 #endif
2600    int server_body;
2601    int ms_iis5_hack = 0;
2602    unsigned long long byte_count = 0;
2603    struct http_request *http;
2604    long len = 0; /* for buffer sizes (and negative error codes) */
2605    int buffer_and_filter_content = 0;
2606    unsigned int write_delay;
2607 #ifdef FEATURE_HTTPS_INSPECTION
2608    int ret = 0;
2609    int use_ssl_tunnel = 0;
2610    csp->dont_verify_certificate = 0;
2611
2612    if (csp->http->ssl && !(csp->action->flags & ACTION_HTTPS_INSPECTION))
2613    {
2614       /* Pass encrypted content without filtering. */
2615       use_ssl_tunnel = 1;
2616    }
2617 #endif
2618
2619    /* Skeleton for HTTP response, if we should intercept the request */
2620    struct http_response *rsp;
2621 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2622    int watch_client_socket;
2623 #endif
2624
2625    csp->receive_buffer_size = csp->config->receive_buffer_size;
2626    csp->receive_buffer = zalloc(csp->receive_buffer_size + 1);
2627    if (csp->receive_buffer == NULL)
2628    {
2629       log_error(LOG_LEVEL_ERROR,
2630          "Out of memory. Failed to allocate the receive buffer.");
2631       rsp = cgi_error_memory();
2632       send_crunch_response(csp, rsp);
2633       return;
2634    }
2635
2636    http = csp->http;
2637
2638 #ifndef HAVE_POLL
2639    maxfd = (csp->cfd > csp->server_connection.sfd) ?
2640       csp->cfd : csp->server_connection.sfd;
2641 #endif
2642
2643    /* pass data between the client and server
2644     * until one or the other shuts down the connection.
2645     */
2646
2647    server_body = 0;
2648
2649 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2650    watch_client_socket = 0 == (csp->flags & CSP_FLAG_PIPELINED_REQUEST_WAITING);
2651 #endif
2652    write_delay = get_write_delay(csp);
2653
2654    for (;;)
2655    {
2656 #ifndef HAVE_POLL
2657       FD_ZERO(&rfds);
2658 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2659       if (!watch_client_socket)
2660       {
2661          maxfd = csp->server_connection.sfd;
2662       }
2663       else
2664 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
2665       {
2666          FD_SET(csp->cfd, &rfds);
2667       }
2668
2669       FD_SET(csp->server_connection.sfd, &rfds);
2670 #endif /* ndef HAVE_POLL */
2671
2672 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2673       if ((csp->flags & CSP_FLAG_CHUNKED)
2674          && !(csp->flags & CSP_FLAG_CONTENT_LENGTH_SET)
2675          && ((csp->iob->eod - csp->iob->cur) >= 5)
2676          && !memcmp(csp->iob->eod-5, "0\r\n\r\n", 5))
2677       {
2678          /*
2679           * XXX: This check should be obsolete now,
2680           *      but let's wait a while to be sure.
2681           */
2682          log_error(LOG_LEVEL_CONNECT,
2683             "Looks like we got the last chunk together with "
2684             "the server headers but didn't detect it earlier. "
2685             "We better stop reading.");
2686          byte_count = (unsigned long long)(csp->iob->eod - csp->iob->cur);
2687          csp->expected_content_length = byte_count;
2688          csp->flags |= CSP_FLAG_CONTENT_LENGTH_SET;
2689       }
2690       if (server_body && server_response_is_complete(csp, byte_count))
2691       {
2692          if (csp->expected_content_length == byte_count)
2693          {
2694             log_error(LOG_LEVEL_CONNECT,
2695                "Done reading from server. Content length: %llu as expected. "
2696                "Bytes most recently read: %ld.",
2697                byte_count, len);
2698          }
2699          else
2700          {
2701             log_error(LOG_LEVEL_CONNECT,
2702                "Done reading from server. Expected content length: %llu. "
2703                "Actual content length: %llu. Bytes most recently read: %ld.",
2704                csp->expected_content_length, byte_count, len);
2705          }
2706          len = 0;
2707          /*
2708           * XXX: Should not jump around, handle_established_connection()
2709           * is complicated enough already.
2710           */
2711          goto reading_done;
2712       }
2713 #endif  /* FEATURE_CONNECTION_KEEP_ALIVE */
2714
2715 #ifdef HAVE_POLL
2716       poll_fds[0].fd = csp->cfd;
2717 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2718       if (!watch_client_socket)
2719       {
2720          /*
2721           * Ignore incoming data, but still watch out
2722           * for disconnects etc. These flags are always
2723           * implied anyway but explicitly setting them
2724           * doesn't hurt.
2725           */
2726          poll_fds[0].events = POLLERR|POLLHUP;
2727       }
2728       else
2729 #endif
2730       {
2731          poll_fds[0].events = POLLIN;
2732       }
2733       poll_fds[1].fd = csp->server_connection.sfd;
2734       poll_fds[1].events = POLLIN;
2735       n = poll(poll_fds, 2, csp->config->socket_timeout * 1000);
2736 #else
2737       timeout.tv_sec = csp->config->socket_timeout;
2738       timeout.tv_usec = 0;
2739       n = select((int)maxfd + 1, &rfds, NULL, NULL, &timeout);
2740 #endif /* def HAVE_POLL */
2741
2742       /*server or client not responding in timeout */
2743       if (n == 0)
2744       {
2745          log_error(LOG_LEVEL_CONNECT, "Socket timeout %d reached: %s",
2746             csp->config->socket_timeout, http->url);
2747          if ((byte_count == 0) && (http->ssl == 0))
2748          {
2749             send_crunch_response(csp, error_response(csp, "connection-timeout"));
2750          }
2751          mark_server_socket_tainted(csp);
2752 #ifdef FEATURE_HTTPS_INSPECTION
2753          close_client_and_server_ssl_connections(csp);
2754 #endif
2755          return;
2756       }
2757       else if (n < 0)
2758       {
2759 #ifdef HAVE_POLL
2760          log_error(LOG_LEVEL_ERROR, "poll() failed!: %E");
2761 #else
2762          log_error(LOG_LEVEL_ERROR, "select() failed!: %E");
2763 #endif
2764          mark_server_socket_tainted(csp);
2765 #ifdef FEATURE_HTTPS_INSPECTION
2766          close_client_and_server_ssl_connections(csp);
2767 #endif
2768          return;
2769       }
2770
2771       /*
2772        * This is the body of the browser's request,
2773        * just read and write it.
2774        *
2775        * Receives data from browser and sends it to server
2776        *
2777        * XXX: Make sure the client doesn't use pipelining
2778        * behind Privoxy's back.
2779        */
2780 #ifdef HAVE_POLL
2781       if ((poll_fds[0].revents & (POLLERR|POLLHUP|POLLNVAL)) != 0)
2782       {
2783          log_error(LOG_LEVEL_CONNECT,
2784             "The client socket %d has become unusable while "
2785             "the server socket %d is still open.",
2786             csp->cfd, csp->server_connection.sfd);
2787          mark_server_socket_tainted(csp);
2788          break;
2789       }
2790
2791       if (poll_fds[0].revents != 0)
2792 #else
2793       if (FD_ISSET(csp->cfd, &rfds))
2794 #endif /* def HAVE_POLL*/
2795       {
2796          int max_bytes_to_read = (int)csp->receive_buffer_size;
2797
2798 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2799          if ((csp->flags & CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ))
2800          {
2801             if (data_is_available(csp->cfd, 0))
2802             {
2803                /*
2804                 * If the next request is already waiting, we have
2805                 * to stop select()ing the client socket. Otherwise
2806                 * we would always return right away and get nothing
2807                 * else done.
2808                 */
2809                watch_client_socket = 0;
2810                log_error(LOG_LEVEL_CONNECT,
2811                   "Stop watching client socket %d. "
2812                   "There's already another request waiting.",
2813                   csp->cfd);
2814                continue;
2815             }
2816             /*
2817              * If the client socket is set, but there's no data
2818              * available on the socket, the client went fishing
2819              * and continuing talking to the server makes no sense.
2820              */
2821             log_error(LOG_LEVEL_CONNECT,
2822                "The client closed socket %d while "
2823                "the server socket %d is still open.",
2824                csp->cfd, csp->server_connection.sfd);
2825             mark_server_socket_tainted(csp);
2826             break;
2827          }
2828          if (csp->expected_client_content_length != 0)
2829          {
2830             if (csp->expected_client_content_length < csp->receive_buffer_size)
2831             {
2832                max_bytes_to_read = (int)csp->expected_client_content_length;
2833             }
2834             log_error(LOG_LEVEL_CONNECT,
2835                "Waiting for up to %d bytes from the client.",
2836                max_bytes_to_read);
2837          }
2838          assert(max_bytes_to_read <= csp->receive_buffer_size);
2839 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
2840
2841 #ifdef FEATURE_HTTPS_INSPECTION
2842          if (client_use_ssl(csp))
2843          {
2844             if (csp->http->status == 101)
2845             {
2846                len = ssl_recv_data(&(csp->ssl_client_attr),
2847                   (unsigned char *)csp->receive_buffer,
2848                   (size_t)max_bytes_to_read);
2849                if (len == -1)
2850                {
2851                   log_error(LOG_LEVEL_ERROR, "Failed to receive data "
2852                      "on client socket %d for an upgraded connection",
2853                      csp->cfd);
2854                   break;
2855                }
2856                if (len == 0)
2857                {
2858                   log_error(LOG_LEVEL_CONNECT, "Done receiving data "
2859                      "on client socket %d for an upgraded connection",
2860                      csp->cfd);
2861                   break;
2862                }
2863                byte_count += (unsigned long long)len;
2864                len = ssl_send_data(&(csp->ssl_server_attr),
2865                   (unsigned char *)csp->receive_buffer, (size_t)len);
2866                if (len == -1)
2867                {
2868                   log_error(LOG_LEVEL_ERROR, "Failed to send data "
2869                      "on server socket %d for an upgraded connection",
2870                      csp->server_connection.sfd);
2871                   break;
2872                }
2873                continue;
2874             }
2875             log_error(LOG_LEVEL_CONNECT, "Breaking with TLS/SSL.");
2876             break;
2877          }
2878          else
2879 #endif /* def FEATURE_HTTPS_INSPECTION */
2880          {
2881             len = read_socket(csp->cfd, csp->receive_buffer, max_bytes_to_read);
2882
2883             if (len <= 0)
2884             {
2885                /* XXX: not sure if this is necessary. */
2886                mark_server_socket_tainted(csp);
2887                break; /* "game over, man" */
2888             }
2889
2890 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2891             if (csp->expected_client_content_length != 0)
2892             {
2893                assert(len <= max_bytes_to_read);
2894                csp->expected_client_content_length -= (unsigned)len;
2895                log_error(LOG_LEVEL_CONNECT,
2896                   "Expected client content length set to %llu "
2897                   "after reading %ld bytes.",
2898                   csp->expected_client_content_length, len);
2899                if (csp->expected_client_content_length == 0)
2900                {
2901                   log_error(LOG_LEVEL_CONNECT,
2902                      "Done reading from the client.");
2903                   csp->flags |= CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
2904                }
2905             }
2906 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
2907
2908             if (write_socket(csp->server_connection.sfd, csp->receive_buffer, (size_t)len))
2909             {
2910                log_error(LOG_LEVEL_ERROR, "write to: %s failed: %E", http->host);
2911                mark_server_socket_tainted(csp);
2912                return;
2913             }
2914          }
2915          continue;
2916       }
2917
2918       /*
2919        * The server wants to talk. It could be the header or the body.
2920        * If `hdr' is null, then it's the header otherwise it's the body.
2921        * FIXME: Does `hdr' really mean `host'? No.
2922        */
2923 #ifdef HAVE_POLL
2924       if (poll_fds[1].revents != 0)
2925 #else
2926       if (FD_ISSET(csp->server_connection.sfd, &rfds))
2927 #endif /* HAVE_POLL */
2928       {
2929 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2930          /*
2931           * If we are buffering content, we don't want to eat up to
2932           * buffer-limit bytes if the client no longer cares about them.
2933           * If we aren't buffering, however, a dead client socket will be
2934           * noticed pretty much right away anyway, so we can reduce the
2935           * overhead by skipping the check.
2936           */
2937          if (buffer_and_filter_content && !socket_is_still_alive(csp->cfd))
2938          {
2939 #ifdef _WIN32
2940             log_error(LOG_LEVEL_CONNECT,
2941                "The server still wants to talk, but the client may already have hung up on us.");
2942 #else
2943             log_error(LOG_LEVEL_CONNECT,
2944                "The server still wants to talk, but the client hung up on us.");
2945             mark_server_socket_tainted(csp);
2946 #ifdef FEATURE_HTTPS_INSPECTION
2947             close_client_and_server_ssl_connections(csp);
2948 #endif
2949             return;
2950 #endif /* def _WIN32 */
2951          }
2952 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
2953
2954 #ifdef FEATURE_HTTPS_INSPECTION
2955          /*
2956           * Reading data from standard or secured connection (HTTP/HTTPS)
2957           */
2958          if (server_use_ssl(csp))
2959          {
2960             len = ssl_recv_data(&(csp->ssl_server_attr),
2961                (unsigned char *)csp->receive_buffer, csp->receive_buffer_size);
2962          }
2963          else
2964 #endif
2965          {
2966             len = read_socket(csp->server_connection.sfd, csp->receive_buffer,
2967                (int)csp->receive_buffer_size);
2968          }
2969
2970          if (len < 0)
2971          {
2972             log_error(LOG_LEVEL_ERROR, "read from: %s failed: %E", http->host);
2973
2974             if ((http->ssl && (csp->fwd == NULL))
2975 #ifdef FEATURE_HTTPS_INSPECTION
2976                && use_ssl_tunnel
2977 #endif
2978                 )
2979             {
2980                /*
2981                 * Just hang up. We already confirmed the client's CONNECT
2982                 * request with status code 200 and unencrypted content is
2983                 * no longer welcome.
2984                 */
2985                log_error(LOG_LEVEL_ERROR,
2986                   "CONNECT already confirmed. Unable to tell the client about the problem.");
2987                return;
2988             }
2989             else if (byte_count)
2990             {
2991                /*
2992                 * Just hang up. We already transmitted the original headers
2993                 * and parts of the original content and therefore missed the
2994                 * chance to send an error message (without risking data corruption).
2995                 *
2996                 * XXX: we could retry with a fancy range request here.
2997                 */
2998                log_error(LOG_LEVEL_ERROR, "Already forwarded the original headers. "
2999                   "Unable to tell the client about the problem.");
3000                mark_server_socket_tainted(csp);
3001 #ifdef FEATURE_HTTPS_INSPECTION
3002                close_client_and_server_ssl_connections(csp);
3003 #endif
3004                return;
3005             }
3006             /*
3007              * XXX: Consider handling the cases above the same.
3008              */
3009             mark_server_socket_tainted(csp);
3010             len = 0;
3011          }
3012
3013 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3014          if (csp->flags & CSP_FLAG_CHUNKED)
3015          {
3016             if ((len >= 5) && !memcmp(csp->receive_buffer+len-5, "0\r\n\r\n", 5))
3017             {
3018                /* XXX: this is a temporary hack */
3019                log_error(LOG_LEVEL_CONNECT,
3020                   "Looks like we reached the end of the last chunk. "
3021                   "We better stop reading.");
3022                csp->expected_content_length = byte_count + (unsigned long long)len;
3023                csp->flags |= CSP_FLAG_CONTENT_LENGTH_SET;
3024             }
3025          }
3026          reading_done:
3027 #endif  /* FEATURE_CONNECTION_KEEP_ALIVE */
3028
3029          /*
3030           * This is guaranteed by allocating with zalloc_or_die()
3031           * and never (intentionally) writing to the last byte.
3032           *
3033           * csp->receive_buffer_size is the size of the part of the
3034           * buffer we intentionally write to, but we actually
3035           * allocated csp->receive_buffer_size+1 bytes so the assertion
3036           * stays within the allocated range.
3037           */
3038          assert(csp->receive_buffer[csp->receive_buffer_size] == '\0');
3039
3040          /*
3041           * Add a trailing zero to be able to use string operations.
3042           * XXX: do we still need this with filter_popups gone?
3043           */
3044          assert(len <= csp->receive_buffer_size);
3045          csp->receive_buffer[len] = '\0';
3046
3047          /*
3048           * Normally, this would indicate that we've read
3049           * as much as the server has sent us and we can
3050           * close the client connection.  However, Microsoft
3051           * in its wisdom has released IIS/5 with a bug that
3052           * prevents it from sending the trailing \r\n in
3053           * a 302 redirect header (and possibly other headers).
3054           * To work around this, if we haven't parsed
3055           * a full header we'll append a trailing \r\n
3056           * and see if this now generates a valid one.
3057           *
3058           * This hack shouldn't have any impacts.  If we've
3059           * already transmitted the header or if this is a
3060           * SSL connection, then we won't bother with this
3061           * hack.  So we only work on partially received
3062           * headers.  If we append a \r\n and this still
3063           * doesn't generate a valid header, then we won't
3064           * transmit anything to the client.
3065           */
3066          if (len == 0)
3067          {
3068
3069             if (server_body || (http->ssl
3070 #ifdef FEATURE_HTTPS_INSPECTION
3071                   && use_ssl_tunnel
3072 #endif
3073                ))
3074             {
3075                /*
3076                 * If we have been buffering up the document,
3077                 * now is the time to apply content modification
3078                 * and send the result to the client.
3079                 */
3080                if (buffer_and_filter_content)
3081                {
3082                   p = execute_content_filters(csp);
3083                   /*
3084                    * If content filtering fails, use the original
3085                    * buffer and length.
3086                    * (see p != NULL ? p : csp->iob->cur below)
3087                    */
3088                   if (NULL == p)
3089                   {
3090                      csp->content_length = (size_t)(csp->iob->eod - csp->iob->cur);
3091                   }
3092 #ifdef FEATURE_COMPRESSION
3093                   else if ((csp->flags & CSP_FLAG_CLIENT_SUPPORTS_DEFLATE)
3094                      && (csp->content_length > LOWER_LENGTH_LIMIT_FOR_COMPRESSION))
3095                   {
3096                      char *compressed_content = compress_buffer(p,
3097                         (size_t *)&csp->content_length, csp->config->compression_level);
3098                      if (compressed_content != NULL)
3099                      {
3100                         freez(p);
3101                         p = compressed_content;
3102                         csp->flags |= CSP_FLAG_BUFFERED_CONTENT_DEFLATED;
3103                      }
3104                   }
3105 #endif
3106
3107                   if (JB_ERR_OK != update_server_headers(csp))
3108                   {
3109                      log_error(LOG_LEVEL_FATAL,
3110                         "Failed to update server headers. after filtering.");
3111                   }
3112
3113                   hdr = list_to_text(csp->headers);
3114                   if (hdr == NULL)
3115                   {
3116                      /* FIXME Should handle error properly */
3117                      log_error(LOG_LEVEL_FATAL, "Out of memory parsing server header");
3118                   }
3119
3120 #ifdef FEATURE_HTTPS_INSPECTION
3121                   /*
3122                    * Sending data with standard or secured connection (HTTP/HTTPS)
3123                    */
3124                   if (client_use_ssl(csp))
3125                   {
3126                      if ((ssl_send_data_delayed(&(csp->ssl_client_attr),
3127                               (const unsigned char *)hdr, strlen(hdr),
3128                               get_write_delay(csp)) < 0)
3129                         || (ssl_send_data_delayed(&(csp->ssl_client_attr),
3130                               (const unsigned char *) ((p != NULL) ? p : csp->iob->cur),
3131                               csp->content_length, get_write_delay(csp)) < 0))
3132                      {
3133                         log_error(LOG_LEVEL_ERROR, "write modified content to "
3134                            "client over TLS/SSL failed");
3135                         freez(hdr);
3136                         freez(p);
3137                         mark_server_socket_tainted(csp);
3138                         close_client_and_server_ssl_connections(csp);
3139                         return;
3140                      }
3141                   }
3142                   else
3143 #endif /* def FEATURE_HTTPS_INSPECTION */
3144                   {
3145                      if (write_socket_delayed(csp->cfd, hdr, strlen(hdr), write_delay)
3146                       || write_socket_delayed(csp->cfd, ((p != NULL) ? p : csp->iob->cur),
3147                          (size_t)csp->content_length, write_delay))
3148                      {
3149                         log_error(LOG_LEVEL_ERROR, "write modified content to client failed: %E");
3150                         freez(hdr);
3151                         freez(p);
3152                         mark_server_socket_tainted(csp);
3153                         return;
3154                      }
3155                   }
3156
3157                   freez(hdr);
3158                   freez(p);
3159                }
3160
3161                break; /* "game over, man" */
3162             }
3163
3164             /*
3165              * This is NOT the body, so
3166              * Let's pretend the server just sent us a blank line.
3167              */
3168             snprintf(csp->receive_buffer, csp->receive_buffer_size, "\r\n");
3169             len = (int)strlen(csp->receive_buffer);
3170
3171             /*
3172              * Now, let the normal header parsing algorithm below do its
3173              * job.  If it fails, we'll exit instead of continuing.
3174              */
3175
3176             ms_iis5_hack = 1;
3177          }
3178
3179          /*
3180           * If we're in the body of the server document, just write it to
3181           * the client, unless we need to buffer the body for later
3182           * content-filtering.
3183           */
3184          if (server_body || (http->ssl
3185 #ifdef FEATURE_HTTPS_INSPECTION
3186                && use_ssl_tunnel
3187 #endif
3188             ))
3189          {
3190             if (buffer_and_filter_content)
3191             {
3192                /*
3193                 * If there is no memory left for buffering the content, or the buffer limit
3194                 * has been reached, switch to non-filtering mode, i.e. make & write the
3195                 * header, flush the iob and buf, and get out of the way.
3196                 */
3197                if (add_to_iob(csp->iob, csp->config->buffer_limit, csp->receive_buffer, len))
3198                {
3199                   size_t hdrlen;
3200                   long flushed;
3201
3202                   log_error(LOG_LEVEL_INFO,
3203                      "Flushing header and buffers. Stepping back from filtering.");
3204
3205                   hdr = list_to_text(csp->headers);
3206                   if (hdr == NULL)
3207                   {
3208                      /*
3209                       * Memory is too tight to even generate the header.
3210                       * Send our static "Out-of-memory" page.
3211                       */
3212                      log_error(LOG_LEVEL_ERROR, "Out of memory while trying to flush.");
3213                      rsp = cgi_error_memory();
3214                      send_crunch_response(csp, rsp);
3215                      mark_server_socket_tainted(csp);
3216 #ifdef FEATURE_HTTPS_INSPECTION
3217                      close_client_and_server_ssl_connections(csp);
3218 #endif
3219                      return;
3220                   }
3221                   hdrlen = strlen(hdr);
3222
3223 #ifdef FEATURE_HTTPS_INSPECTION
3224                   /*
3225                    * Sending data with standard or secured connection (HTTP/HTTPS)
3226                    */
3227                   if (client_use_ssl(csp))
3228                   {
3229                      if ((ssl_send_data_delayed(&(csp->ssl_client_attr),
3230                              (const unsigned char *)hdr, hdrlen, get_write_delay(csp)) < 0)
3231                         || ((flushed = ssl_flush_socket(&(csp->ssl_client_attr),
3232                                 csp->iob)) < 0)
3233                         || (ssl_send_data_delayed(&(csp->ssl_client_attr),
3234                               (const unsigned char *)csp->receive_buffer, (size_t)len,
3235                               get_write_delay(csp)) < 0))
3236                      {
3237                         log_error(LOG_LEVEL_CONNECT,
3238                            "Flush header and buffers to client failed");
3239                         freez(hdr);
3240                         mark_server_socket_tainted(csp);
3241                         close_client_and_server_ssl_connections(csp);
3242                         return;
3243                      }
3244                   }
3245                   else
3246 #endif /* def FEATURE_HTTPS_INSPECTION */
3247                   {
3248                      if (write_socket_delayed(csp->cfd, hdr, hdrlen, write_delay)
3249                       || ((flushed = flush_iob(csp->cfd, csp->iob, write_delay)) < 0)
3250                       || write_socket_delayed(csp->cfd, csp->receive_buffer, (size_t)len,
3251                             write_delay))
3252                      {
3253                         log_error(LOG_LEVEL_CONNECT,
3254                            "Flush header and buffers to client failed: %E");
3255                         freez(hdr);
3256                         mark_server_socket_tainted(csp);
3257                         return;
3258                      }
3259                   }
3260
3261                   /*
3262                    * Reset the byte_count to the amount of bytes
3263                    * we just flushed. len will be added a few lines below,
3264                    * hdrlen doesn't matter for LOG_LEVEL_CLF.
3265                    */
3266                   byte_count = (unsigned long long)flushed;
3267                   freez(hdr);
3268                   buffer_and_filter_content = 0;
3269                   server_body = 1;
3270                }
3271             }
3272             else
3273             {
3274 #ifdef FEATURE_HTTPS_INSPECTION
3275                /*
3276                 * Sending data with standard or secured connection (HTTP/HTTPS)
3277                 */
3278                if (client_use_ssl(csp))
3279                {
3280                   ret = ssl_send_data_delayed(&(csp->ssl_client_attr),
3281                      (const unsigned char *)csp->receive_buffer, (size_t)len,
3282                      get_write_delay(csp));
3283                   if (ret < 0)
3284                   {
3285                      log_error(LOG_LEVEL_ERROR,
3286                         "Sending data to client failed");
3287                      mark_server_socket_tainted(csp);
3288                      close_client_and_server_ssl_connections(csp);
3289                      return;
3290                   }
3291                }
3292                else
3293 #endif /* def FEATURE_HTTPS_INSPECTION */
3294                {
3295                   if (write_socket_delayed(csp->cfd, csp->receive_buffer,
3296                         (size_t)len, write_delay))
3297                   {
3298                      log_error(LOG_LEVEL_ERROR, "write to client failed: %E");
3299                      mark_server_socket_tainted(csp);
3300                      return;
3301                   }
3302                }
3303             }
3304             byte_count += (unsigned long long)len;
3305             continue;
3306          }
3307          else
3308          {
3309             /*
3310              * We're still looking for the end of the server's header.
3311              * Buffer up the data we just read.  If that fails, there's
3312              * little we can do but send our static out-of-memory page.
3313              */
3314             if (add_to_iob(csp->iob, csp->config->buffer_limit, csp->receive_buffer, len))
3315             {
3316                log_error(LOG_LEVEL_ERROR, "Out of memory while looking for end of server headers.");
3317                rsp = cgi_error_memory();
3318                send_crunch_response(csp, rsp);
3319                mark_server_socket_tainted(csp);
3320 #ifdef FEATURE_HTTPS_INSPECTION
3321                close_client_and_server_ssl_connections(csp);
3322 #endif
3323                return;
3324             }
3325
3326             /* Convert iob into something sed() can digest */
3327             if (JB_ERR_PARSE == get_server_headers(csp))
3328             {
3329                if (ms_iis5_hack)
3330                {
3331                   /*
3332                    * Well, we tried our MS IIS/5 hack and it didn't work.
3333                    * The header is incomplete and there isn't anything
3334                    * we can do about it.
3335                    */
3336                   log_error(LOG_LEVEL_ERROR, "Invalid server headers. "
3337                      "Applying the MS IIS5 hack didn't help.");
3338                   log_error(LOG_LEVEL_CLF,
3339                      "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3340 #ifdef FEATURE_HTTPS_INSPECTION
3341                   /*
3342                    * Sending data with standard or secured connection (HTTP/HTTPS)
3343                    */
3344                   if (client_use_ssl(csp))
3345                   {
3346                      ssl_send_data_delayed(&(csp->ssl_client_attr),
3347                         (const unsigned char *)INVALID_SERVER_HEADERS_RESPONSE,
3348                         strlen(INVALID_SERVER_HEADERS_RESPONSE), get_write_delay(csp));
3349                   }
3350                   else
3351 #endif /* def FEATURE_HTTPS_INSPECTION */
3352                   {
3353                      write_socket_delayed(csp->cfd,
3354                         INVALID_SERVER_HEADERS_RESPONSE,
3355                         strlen(INVALID_SERVER_HEADERS_RESPONSE), write_delay);
3356                   }
3357                   mark_server_socket_tainted(csp);
3358 #ifdef FEATURE_HTTPS_INSPECTION
3359                   close_client_and_server_ssl_connections(csp);
3360 #endif
3361                   return;
3362                }
3363                else
3364                {
3365                   /*
3366                    * Since we have to wait for more from the server before
3367                    * we can parse the headers we just continue here.
3368                    */
3369                   log_error(LOG_LEVEL_CONNECT,
3370                      "Continuing buffering server headers from socket %d. "
3371                      "Bytes most recently read: %ld.", csp->cfd, len);
3372                   continue;
3373                }
3374             }
3375             else
3376             {
3377                /*
3378                 * Account for the content bytes we
3379                 * might have gotten with the headers.
3380                 */
3381                assert(csp->iob->eod >= csp->iob->cur);
3382                byte_count = (unsigned long long)(csp->iob->eod - csp->iob->cur);
3383             }
3384
3385             /* Did we actually get anything? */
3386             if (NULL == csp->headers->first)
3387             {
3388                if ((csp->flags & CSP_FLAG_REUSED_CLIENT_CONNECTION))
3389                {
3390                   log_error(LOG_LEVEL_ERROR,
3391                      "No server or forwarder response received on socket %d. "
3392                      "Closing client socket %d without sending data.",
3393                      csp->server_connection.sfd, csp->cfd);
3394                   log_error(LOG_LEVEL_CLF,
3395                      "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3396                }
3397                else
3398                {
3399                   log_error(LOG_LEVEL_ERROR,
3400                      "No server or forwarder response received on socket %d.",
3401                      csp->server_connection.sfd);
3402                   send_crunch_response(csp, error_response(csp, "no-server-data"));
3403                }
3404                free_http_request(http);
3405                mark_server_socket_tainted(csp);
3406 #ifdef FEATURE_HTTPS_INSPECTION
3407                close_client_and_server_ssl_connections(csp);
3408 #endif
3409                return;
3410             }
3411
3412             if (!csp->headers->first->str)
3413             {
3414                log_error(LOG_LEVEL_ERROR, "header search: csp->headers->first->str == NULL, assert will be called");
3415             }
3416             assert(csp->headers->first->str);
3417
3418             if (strncmpic(csp->headers->first->str, "HTTP", 4) &&
3419                 strncmpic(csp->headers->first->str, "ICY", 3))
3420             {
3421                /*
3422                 * It doesn't look like a HTTP (or Shoutcast) response:
3423                 * tell the client and log the problem.
3424                 */
3425                if (strlen(csp->headers->first->str) > 30)
3426                {
3427                   csp->headers->first->str[30] = '\0';
3428                }
3429                log_error(LOG_LEVEL_ERROR,
3430                   "Invalid server or forwarder response. Starts with: %s",
3431                   csp->headers->first->str);
3432                log_error(LOG_LEVEL_CLF,
3433                   "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3434 #ifdef FEATURE_HTTPS_INSPECTION
3435                /*
3436                 * Sending data with standard or secured connection (HTTP/HTTPS)
3437                 */
3438                if (client_use_ssl(csp))
3439                {
3440                   ssl_send_data_delayed(&(csp->ssl_client_attr),
3441                      (const unsigned char *)INVALID_SERVER_HEADERS_RESPONSE,
3442                      strlen(INVALID_SERVER_HEADERS_RESPONSE),
3443                      get_write_delay(csp));
3444                }
3445                else
3446 #endif /* def FEATURE_HTTPS_INSPECTION */
3447                {
3448                   write_socket_delayed(csp->cfd, INVALID_SERVER_HEADERS_RESPONSE,
3449                      strlen(INVALID_SERVER_HEADERS_RESPONSE), write_delay);
3450                }
3451                free_http_request(http);
3452                mark_server_socket_tainted(csp);
3453 #ifdef FEATURE_HTTPS_INSPECTION
3454                close_client_and_server_ssl_connections(csp);
3455 #endif
3456                return;
3457             }
3458
3459             /*
3460              * We have now received the entire server header,
3461              * filter it and send the result to the client
3462              */
3463             if (JB_ERR_OK != sed(csp, FILTER_SERVER_HEADERS))
3464             {
3465                log_error(LOG_LEVEL_CLF,
3466                   "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3467 #ifdef FEATURE_HTTPS_INSPECTION
3468                /*
3469                 * Sending data with standard or secured connection (HTTP/HTTPS)
3470                 */
3471                if (client_use_ssl(csp))
3472                {
3473                   ssl_send_data_delayed(&(csp->ssl_client_attr),
3474                      (const unsigned char *)INVALID_SERVER_HEADERS_RESPONSE,
3475                      strlen(INVALID_SERVER_HEADERS_RESPONSE),
3476                      get_write_delay(csp));
3477                }
3478                else
3479 #endif
3480                {
3481                   write_socket_delayed(csp->cfd, INVALID_SERVER_HEADERS_RESPONSE,
3482                      strlen(INVALID_SERVER_HEADERS_RESPONSE), write_delay);
3483                }
3484                free_http_request(http);
3485                mark_server_socket_tainted(csp);
3486 #ifdef FEATURE_HTTPS_INSPECTION
3487                close_client_and_server_ssl_connections(csp);
3488 #endif
3489                return;
3490             }
3491             hdr = list_to_text(csp->headers);
3492             if (hdr == NULL)
3493             {
3494                /* FIXME Should handle error properly */
3495                log_error(LOG_LEVEL_FATAL, "Out of memory parsing server header");
3496             }
3497
3498             if ((csp->flags & CSP_FLAG_CHUNKED)
3499                && !(csp->flags & CSP_FLAG_CONTENT_LENGTH_SET)
3500                && ((csp->iob->eod - csp->iob->cur) >= 5)
3501                && !memcmp(csp->iob->eod-5, "0\r\n\r\n", 5))
3502             {
3503                log_error(LOG_LEVEL_CONNECT,
3504                   "Looks like we got the last chunk together with "
3505                   "the server headers. We better stop reading.");
3506                byte_count = (unsigned long long)(csp->iob->eod - csp->iob->cur);
3507                csp->expected_content_length = byte_count;
3508                csp->flags |= CSP_FLAG_CONTENT_LENGTH_SET;
3509             }
3510
3511             csp->server_connection.response_received = time(NULL);
3512
3513             if (crunch_response_triggered(csp, crunchers_light))
3514             {
3515                /*
3516                 * One of the tags created by a server-header
3517                 * tagger triggered a crunch. We already
3518                 * delivered the crunch response to the client
3519                 * and are done here after cleaning up.
3520                 */
3521                freez(hdr);
3522                mark_server_socket_tainted(csp);
3523 #ifdef FEATURE_HTTPS_INSPECTION
3524                close_client_and_server_ssl_connections(csp);
3525 #endif
3526                return;
3527             }
3528
3529             /* Buffer and pcrs filter this if appropriate. */
3530             buffer_and_filter_content = content_requires_filtering(csp);
3531
3532             if (!buffer_and_filter_content)
3533             {
3534                /*
3535                 * Write the server's (modified) header to
3536                 * the client (along with anything else that
3537                 * may be in the buffer). Use standard or secured
3538                 * connection.
3539                 */
3540 #ifdef FEATURE_HTTPS_INSPECTION
3541                if (client_use_ssl(csp))
3542                {
3543                   if ((ssl_send_data_delayed(&(csp->ssl_client_attr),
3544                           (const unsigned char *)hdr, strlen(hdr),
3545                           get_write_delay(csp)) < 0)
3546                      || (len = ssl_flush_socket(&(csp->ssl_client_attr),
3547                             csp->iob) < 0))
3548                   {
3549                      log_error(LOG_LEVEL_CONNECT, "Write header to client failed");
3550
3551                      /*
3552                       * The write failed, so don't bother mentioning it
3553                       * to the client... it probably can't hear us anyway.
3554                       */
3555                      freez(hdr);
3556                      mark_server_socket_tainted(csp);
3557 #ifdef FEATURE_HTTPS_INSPECTION
3558                      close_client_and_server_ssl_connections(csp);
3559 #endif
3560                      return;
3561                   }
3562                }
3563                else
3564 #endif /* def FEATURE_HTTPS_INSPECTION */
3565                {
3566                   if (write_socket_delayed(csp->cfd, hdr, strlen(hdr), write_delay)
3567                      || ((len = flush_iob(csp->cfd, csp->iob, write_delay)) < 0))
3568                   {
3569                      log_error(LOG_LEVEL_ERROR,
3570                         "write header to client failed");
3571                      /*
3572                       * The write failed, so don't bother mentioning it
3573                       * to the client... it probably can't hear us anyway.
3574                       */
3575                      freez(hdr);
3576                      mark_server_socket_tainted(csp);
3577                      return;
3578                   }
3579                }
3580                                 }
3581
3582             /* we're finished with the server's header */
3583
3584             freez(hdr);
3585             server_body = 1;
3586
3587             /*
3588              * If this was a MS IIS/5 hack then it means the server
3589              * has already closed the connection. Nothing more to read.
3590              * Time to bail.
3591              */
3592             if (ms_iis5_hack)
3593             {
3594                log_error(LOG_LEVEL_ERROR,
3595                   "Closed server connection detected. "
3596                   "Applying the MS IIS5 hack didn't help.");
3597                log_error(LOG_LEVEL_CLF,
3598                   "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3599 #ifdef FEATURE_HTTPS_INSPECTION
3600                /*
3601                 * Sending data with standard or secured connection (HTTP/HTTPS)
3602                 */
3603                if (client_use_ssl(csp))
3604                {
3605                   ssl_send_data_delayed(&(csp->ssl_client_attr),
3606                      (const unsigned char *)INVALID_SERVER_HEADERS_RESPONSE,
3607                      strlen(INVALID_SERVER_HEADERS_RESPONSE),
3608                      get_write_delay(csp));
3609                }
3610                else
3611 #endif /* def FEATURE_HTTPS_INSPECTION */
3612                {
3613                   write_socket_delayed(csp->cfd, INVALID_SERVER_HEADERS_RESPONSE,
3614                      strlen(INVALID_SERVER_HEADERS_RESPONSE), write_delay);
3615                }
3616                mark_server_socket_tainted(csp);
3617 #ifdef FEATURE_HTTPS_INSPECTION
3618                close_client_and_server_ssl_connections(csp);
3619 #endif
3620                return;
3621             }
3622          }
3623          continue;
3624       }
3625       mark_server_socket_tainted(csp);
3626 #ifdef FEATURE_HTTPS_INSPECTION
3627       close_client_and_server_ssl_connections(csp);
3628 #endif
3629       return; /* huh? we should never get here */
3630    }
3631
3632    if (csp->content_length == 0)
3633    {
3634       /*
3635        * If Privoxy didn't recalculate the Content-Length,
3636        * byte_count is still correct.
3637        */
3638       csp->content_length = byte_count;
3639    }
3640
3641 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3642    if ((csp->flags & CSP_FLAG_CONTENT_LENGTH_SET)
3643       && (csp->expected_content_length != byte_count))
3644    {
3645       log_error(LOG_LEVEL_CONNECT,
3646          "Received %llu bytes while expecting %llu.",
3647          byte_count, csp->expected_content_length);
3648       mark_server_socket_tainted(csp);
3649    }
3650 #endif
3651
3652 #ifdef FEATURE_HTTPS_INSPECTION
3653    if (client_use_ssl(csp))
3654    {
3655       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s https://%s%s %s\" 200 %llu",
3656          csp->ip_addr_str, http->gpc, http->hostport, http->path,
3657          http->version, csp->content_length);
3658    }
3659    else
3660 #endif
3661    {
3662       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 200 %llu",
3663          csp->ip_addr_str, http->ocmd, csp->content_length);
3664    }
3665    csp->server_connection.timestamp = time(NULL);
3666 }
3667
3668
3669 /*********************************************************************
3670  *
3671  * Function    :  chat
3672  *
3673  * Description :  Once a connection from the client has been accepted,
3674  *                this function is called (via serve()) to handle the
3675  *                main business of the communication.  This function
3676  *                returns after dealing with a single request. It can
3677  *                be called multiple times with the same client socket
3678  *                if the client is keeping the connection alive.
3679  *
3680  *                The decision whether or not a client connection will
3681  *                be kept alive is up to the caller which also must
3682  *                close the client socket when done.
3683  *
3684  *                FIXME: chat is nearly a thousand lines long.
3685  *                Ridiculous.
3686  *
3687  * Parameters  :
3688  *          1  :  csp = Current client state (buffers, headers, etc...)
3689  *
3690  * Returns     :  Nothing.
3691  *
3692  *********************************************************************/
3693 static void chat(struct client_state *csp)
3694 {
3695    const struct forward_spec *fwd;
3696    struct http_request *http;
3697    /* Skeleton for HTTP response, if we should intercept the request */
3698    struct http_response *rsp;
3699 #ifdef FEATURE_HTTPS_INSPECTION
3700    int use_ssl_tunnel = 0;
3701 #endif
3702
3703    http = csp->http;
3704
3705    if (receive_client_request(csp) != JB_ERR_OK)
3706    {
3707       return;
3708    }
3709    if (parse_client_request(csp) != JB_ERR_OK)
3710    {
3711       return;
3712    }
3713
3714    /* decide how to route the HTTP request */
3715    fwd = forward_url(csp, http);
3716
3717 #ifdef FEATURE_HTTPS_INSPECTION
3718    /*
3719     * Setting flags to use old solution with SSL tunnel and to disable
3720     * certificate verification.
3721     */
3722    if (csp->http->ssl && !(csp->action->flags & ACTION_HTTPS_INSPECTION)
3723       && !cgi_page_requested(csp->http->host))
3724    {
3725       use_ssl_tunnel = 1;
3726    }
3727
3728    if (http->ssl && csp->action->flags & ACTION_IGNORE_CERTIFICATE_ERRORS)
3729    {
3730       csp->dont_verify_certificate = 1;
3731    }
3732 #endif
3733
3734    /*
3735     * build the http request to send to the server
3736     * we have to do one of the following:
3737     *
3738     * create =    use the original HTTP request to create a new
3739     *             HTTP request that has either the path component
3740     *             without the http://domainspec (w/path) or the
3741     *             full original URL (w/url)
3742     *             Note that the path and/or the HTTP version may
3743     *             have been altered by now.
3744     *
3745     * SSL proxy = Open a socket to the host:port of the server
3746     *             and create TLS/SSL connection with server and
3747     *             with client. Then behave like mediator between
3748     *             client and server over TLS/SSL.
3749     *
3750     * SSL proxy = Pass the request unchanged if forwarding a CONNECT
3751     *    with     request to a parent proxy. Note that we'll be sending
3752     * forwarding  the CFAIL message ourselves if connecting to the parent
3753     *             fails, but we won't send a CSUCCEED message if it works,
3754     *             since that would result in a double message (ours and the
3755     *             parent's). After sending the request to the parent, we
3756     *             must parse answer and send it to client. If connection
3757     *             with server is established, we do TLS/SSL proxy. Otherwise
3758     *             we send parent response to client and close connections.
3759     *
3760     * here's the matrix:
3761     *                        SSL
3762     *                    0        1
3763     *                +--------+--------+
3764     *                |        |        |
3765     *             0  | create |   SSL  |
3766     *                | w/path |  proxy |
3767     *  Forwarding    +--------+--------+