563c615378061935d84b67dbb05d48e6c88eabeb
[privoxy.git] / jcc.c
1 /*********************************************************************
2  *
3  * File        :  $Source: /cvsroot/ijbswa/current/jcc.c,v $
4  *
5  * Purpose     :  Main file.  Contains main() method, main loop, and
6  *                the main connection-handling function.
7  *
8  * Copyright   :  Written by and Copyright (C) 2001-2021 the
9  *                Privoxy team. https://www.privoxy.org/
10  *
11  *                Based on the Internet Junkbuster originally written
12  *                by and Copyright (C) 1997 Anonymous Coders and
13  *                Junkbusters Corporation.  http://www.junkbusters.com
14  *
15  *                This program is free software; you can redistribute it
16  *                and/or modify it under the terms of the GNU General
17  *                Public License as published by the Free Software
18  *                Foundation; either version 2 of the License, or (at
19  *                your option) any later version.
20  *
21  *                This program is distributed in the hope that it will
22  *                be useful, but WITHOUT ANY WARRANTY; without even the
23  *                implied warranty of MERCHANTABILITY or FITNESS FOR A
24  *                PARTICULAR PURPOSE.  See the GNU General Public
25  *                License for more details.
26  *
27  *                The GNU General Public License should be included with
28  *                this file.  If not, you can view it at
29  *                http://www.gnu.org/copyleft/gpl.html
30  *                or write to the Free Software Foundation, Inc., 59
31  *                Temple Place - Suite 330, Boston, MA  02111-1307, USA.
32  *
33  *********************************************************************/
34
35
36 #include "config.h"
37
38 #include <stdio.h>
39 #include <sys/types.h>
40 #include <stdlib.h>
41 #include <string.h>
42 #include <signal.h>
43 #include <fcntl.h>
44 #include <errno.h>
45 #include <assert.h>
46
47 #ifdef _WIN32
48 # ifndef FEATURE_PTHREAD
49 #  ifndef STRICT
50 #   define STRICT
51 #  endif
52 #  include <winsock2.h>
53 #  include <windows.h>
54 #  include <process.h>
55 # endif /* ndef FEATURE_PTHREAD */
56
57 # include "win32.h"
58 # ifndef _WIN_CONSOLE
59 #  include "w32log.h"
60 # endif /* ndef _WIN_CONSOLE */
61 # include "w32svrapi.h"
62
63 #else /* ifndef _WIN32 */
64
65 # include <unistd.h>
66 # include <sys/wait.h>
67 # include <sys/time.h>
68 # include <sys/stat.h>
69 # include <sys/ioctl.h>
70
71 #ifdef sun
72 #include <sys/termios.h>
73 #endif /* sun */
74
75 #ifdef unix
76 #include <pwd.h>
77 #include <grp.h>
78 #endif
79
80 # include <signal.h>
81
82 # ifdef __BEOS__
83 #  include <socket.h>  /* BeOS has select() for sockets only. */
84 #  include <OS.h>      /* declarations for threads and stuff. */
85 # endif
86
87 #ifdef HAVE_POLL
88 #ifdef __GLIBC__
89 #include <sys/poll.h>
90 #else
91 #include <poll.h>
92 #endif /* def __GLIBC__ */
93 #else
94 # ifndef FD_ZERO
95 #  include <select.h>
96 # endif
97 #warning poll() appears to be unavailable. Your platform will become unsupported in the future.
98 #endif /* HAVE_POLL */
99
100 #endif
101
102 #include "project.h"
103 #include "list.h"
104 #include "jcc.h"
105 #ifdef FEATURE_HTTPS_INSPECTION
106 #include "ssl.h"
107 #endif
108 #include "filters.h"
109 #include "loaders.h"
110 #include "parsers.h"
111 #include "miscutil.h"
112 #include "errlog.h"
113 #include "jbsockets.h"
114 #include "gateway.h"
115 #include "actions.h"
116 #include "cgi.h"
117 #include "loadcfg.h"
118 #include "urlmatch.h"
119 #ifdef FEATURE_CLIENT_TAGS
120 #include "client-tags.h"
121 #endif
122
123 int daemon_mode = 1;
124 struct client_states clients[1];
125 struct file_list     files[1];
126
127 #ifdef FEATURE_STATISTICS
128 int urls_read     = 0;     /* total nr of urls read inc rejected */
129 int urls_rejected = 0;     /* total nr of urls rejected */
130 #ifdef MUTEX_LOCKS_AVAILABLE
131 unsigned long long number_of_requests_received = 0;
132 unsigned long long number_of_requests_blocked = 0;
133 #endif
134 #endif /* def FEATURE_STATISTICS */
135
136 #ifdef FEATURE_GRACEFUL_TERMINATION
137 int g_terminate = 0;
138 #endif
139
140 #if !defined(_WIN32)
141 static void sig_handler(int the_signal);
142 #endif
143 static int client_protocol_is_unsupported(struct client_state *csp, char *req);
144 static jb_err get_request_destination_elsewhere(struct client_state *csp, struct list *headers);
145 static jb_err get_server_headers(struct client_state *csp);
146 static const char *crunch_reason(const struct http_response *rsp);
147 static void send_crunch_response(struct client_state *csp, struct http_response *rsp);
148 static char *get_request_line(struct client_state *csp);
149 static jb_err receive_client_request(struct client_state *csp);
150 static jb_err parse_client_request(struct client_state *csp);
151 static void build_request_line(struct client_state *csp, const struct forward_spec *fwd, char **request_line);
152 static jb_err change_request_destination(struct client_state *csp);
153 static void handle_established_connection(struct client_state *csp);
154 static void chat(struct client_state *csp);
155 static void serve(struct client_state *csp);
156 #if !defined(_WIN32) || defined(_WIN_CONSOLE)
157 static void usage(const char *myname);
158 #endif
159 static void initialize_mutexes(void);
160 static jb_socket bind_port_helper(const char *haddr, int hport, int backlog);
161 static void bind_ports_helper(struct configuration_spec *config, jb_socket sockets[]);
162 static void close_ports_helper(jb_socket sockets[]);
163 static void listen_loop(void);
164 static void serve(struct client_state *csp);
165
166 #ifdef __BEOS__
167 static int32 server_thread(void *data);
168 #endif /* def __BEOS__ */
169
170 #ifdef _WIN32
171 #define sleep(N)  Sleep(((N) * 1000))
172 #endif
173
174 #ifdef FUZZ
175 int process_fuzzed_input(char *fuzz_input_type, char *fuzz_input_file);
176 void show_fuzz_usage(const char *name);
177 #endif
178
179 #ifdef MUTEX_LOCKS_AVAILABLE
180 /*
181  * XXX: Does the locking stuff really belong in this file?
182  */
183 privoxy_mutex_t log_mutex;
184 privoxy_mutex_t log_init_mutex;
185 privoxy_mutex_t connection_reuse_mutex;
186
187 #ifdef FEATURE_HTTPS_INSPECTION
188 privoxy_mutex_t certificate_mutex;
189 privoxy_mutex_t ssl_init_mutex;
190 #endif
191
192 #ifdef FEATURE_EXTERNAL_FILTERS
193 privoxy_mutex_t external_filter_mutex;
194 #endif
195 #ifdef FEATURE_CLIENT_TAGS
196 privoxy_mutex_t client_tags_mutex;
197 #endif
198 #ifdef FEATURE_STATISTICS
199 privoxy_mutex_t block_statistics_mutex;
200 #endif
201 #ifdef FEATURE_EXTENDED_STATISTICS
202 privoxy_mutex_t filter_statistics_mutex;
203 privoxy_mutex_t block_reason_statistics_mutex;
204 #endif
205
206 #if !defined(HAVE_GETHOSTBYADDR_R) || !defined(HAVE_GETHOSTBYNAME_R)
207 privoxy_mutex_t resolver_mutex;
208 #endif /* !defined(HAVE_GETHOSTBYADDR_R) || !defined(HAVE_GETHOSTBYNAME_R) */
209
210 #ifndef HAVE_GMTIME_R
211 privoxy_mutex_t gmtime_mutex;
212 #endif /* ndef HAVE_GMTIME_R */
213
#ifndef HAVE_LOCALTIME_R
privoxy_mutex_t localtime_mutex;
#endif /* ndef HAVE_LOCALTIME_R */
217
218 #if !defined(HAVE_ARC4RANDOM) && !defined(HAVE_RANDOM)
219 privoxy_mutex_t rand_mutex;
220 #endif /* !defined(HAVE_ARC4RANDOM) && !defined(HAVE_RANDOM) */
221
222 #endif /* def MUTEX_LOCKS_AVAILABLE */
223
224 #if defined(unix)
225 const char *basedir = NULL;
226 const char *pidfile = NULL;
227 static int received_hup_signal = 0;
228 #endif /* defined unix */
229
/* HTTP snippets. */
231 static const char CSUCCEED[] =
232    "HTTP/1.1 200 Connection established\r\n\r\n";
233
234 static const char CHEADER[] =
235    "HTTP/1.1 400 Invalid header received from client\r\n"
236    "Content-Type: text/plain\r\n"
237    "Connection: close\r\n\r\n"
238    "Invalid header received from client.\n";
239
240 static const char FTP_RESPONSE[] =
241    "HTTP/1.1 400 Invalid request received from client\r\n"
242    "Content-Type: text/plain\r\n"
243    "Connection: close\r\n\r\n"
244    "Invalid request. Privoxy doesn't support FTP.\n";
245
246 static const char GOPHER_RESPONSE[] =
247    "HTTP/1.1 400 Invalid request received from client\r\n"
248    "Content-Type: text/plain\r\n"
249    "Connection: close\r\n\r\n"
250    "Invalid request. Privoxy doesn't support gopher.\n";
251
252 /* XXX: should be a template */
253 static const char MISSING_DESTINATION_RESPONSE[] =
254    "HTTP/1.1 400 Bad request received from client\r\n"
255    "Content-Type: text/plain\r\n"
256    "Connection: close\r\n\r\n"
257    "Bad request. Privoxy was unable to extract the destination.\n";
258
259 /* XXX: should be a template */
260 static const char INVALID_SERVER_HEADERS_RESPONSE[] =
261    "HTTP/1.1 502 Server or forwarder response invalid\r\n"
262    "Content-Type: text/plain\r\n"
263    "Connection: close\r\n\r\n"
264    "Bad response. The server or forwarder response doesn't look like HTTP.\n";
265
266 /* XXX: should be a template */
267 static const char MESSED_UP_REQUEST_RESPONSE[] =
268    "HTTP/1.1 400 Malformed request after rewriting\r\n"
269    "Content-Type: text/plain\r\n"
270    "Connection: close\r\n\r\n"
271    "Bad request. Messed up with header filters.\n";
272
273 static const char TOO_MANY_CONNECTIONS_RESPONSE[] =
274    "HTTP/1.1 503 Too many open connections\r\n"
275    "Content-Type: text/plain\r\n"
276    "Connection: close\r\n\r\n"
277    "Maximum number of open connections reached.\n";
278
279 static const char CLIENT_CONNECTION_TIMEOUT_RESPONSE[] =
280    "HTTP/1.1 504 Connection timeout\r\n"
281    "Content-Type: text/plain\r\n"
282    "Connection: close\r\n\r\n"
283    "The connection timed out because the client request didn't arrive in time.\n";
284
285 static const char CLIENT_BODY_PARSE_ERROR_RESPONSE[] =
286    "HTTP/1.1 400 Failed reading client body\r\n"
287    "Content-Type: text/plain\r\n"
288    "Connection: close\r\n\r\n"
289    "Failed parsing or buffering the chunk-encoded client body.\n";
290
291 static const char UNSUPPORTED_CLIENT_EXPECTATION_ERROR_RESPONSE[] =
292    "HTTP/1.1 417 Expecting too much\r\n"
293    "Content-Type: text/plain\r\n"
294    "Connection: close\r\n\r\n"
295    "Privoxy detected an unsupported Expect header value.\n";
296
297 /* A function to crunch a response */
298 typedef struct http_response *(*crunch_func_ptr)(struct client_state *);
299
300 /* Crunch function flags */
301 #define CF_NO_FLAGS        0
302 /* Cruncher applies to forced requests as well */
303 #define CF_IGNORE_FORCE    1
304 /* Crunched requests are counted for the block statistics */
305 #define CF_COUNT_AS_REJECT 2
306
307 /* A crunch function and its flags */
308 struct cruncher
309 {
310    const crunch_func_ptr cruncher;
311    const int flags;
312 };
313
314 static int crunch_response_triggered(struct client_state *csp, const struct cruncher crunchers[]);
315
316 /* Complete list of cruncher functions */
317 static const struct cruncher crunchers_all[] = {
318    { direct_response, CF_COUNT_AS_REJECT|CF_IGNORE_FORCE},
319    { block_url,       CF_COUNT_AS_REJECT },
320 #ifdef FEATURE_TRUST
321    { trust_url,       CF_COUNT_AS_REJECT },
322 #endif /* def FEATURE_TRUST */
323    { redirect_url,    CF_NO_FLAGS  },
324    { dispatch_cgi,    CF_IGNORE_FORCE},
325    { NULL,            0 }
326 };
327
328 /* Light version, used after tags are applied */
329 static const struct cruncher crunchers_light[] = {
330    { block_url,       CF_COUNT_AS_REJECT },
331    { redirect_url,    CF_NO_FLAGS },
332    { NULL,            0 }
333 };
334
335
336 /*
337  * XXX: Don't we really mean
338  *
339  * #if defined(unix)
340  *
341  * here?
342  */
343 #if !defined(_WIN32)
344 /*********************************************************************
345  *
346  * Function    :  sig_handler
347  *
348  * Description :  Signal handler for different signals.
349  *                Exit gracefully on TERM and INT
350  *                or set a flag that will cause the errlog
351  *                to be reopened by the main thread on HUP.
352  *
353  * Parameters  :
354  *          1  :  the_signal = the signal cause this function to call
355  *
356  * Returns     :  -
357  *
358  *********************************************************************/
359 static void sig_handler(int the_signal)
360 {
361    switch(the_signal)
362    {
363       case SIGTERM:
364       case SIGINT:
365          log_error(LOG_LEVEL_INFO, "exiting by signal %d .. bye", the_signal);
366 #if defined(unix)
367          if (pidfile)
368          {
369             unlink(pidfile);
370          }
371 #endif /* unix */
372          exit(the_signal);
373          break;
374
375       case SIGHUP:
376 #if defined(unix)
377          received_hup_signal = 1;
378 #endif
379          break;
380
381       default:
382          /*
383           * We shouldn't be here, unless we catch signals
384           * in main() that we can't handle here!
385           */
386          log_error(LOG_LEVEL_FATAL,
387             "sig_handler: exiting on unexpected signal %d", the_signal);
388    }
389    return;
390
391 }
392 #endif
393
394
395 /*********************************************************************
396  *
397  * Function    :  get_write_delay
398  *
399  * Description :  Parse the delay-response parameter.
400  *
401  * Parameters  :
402  *          1  :  csp = Current client state (buffers, headers, etc...)
403  *
404  * Returns     :  Number of milliseconds to delay writes.
405  *
406  *********************************************************************/
407 static unsigned int get_write_delay(const struct client_state *csp)
408 {
409    unsigned int delay;
410    char *endptr;
411    char *newval;
412
413    if ((csp->action->flags & ACTION_DELAY_RESPONSE) == 0)
414    {
415       return 0;
416    }
417    newval = csp->action->string[ACTION_STRING_DELAY_RESPONSE];
418
419    delay = (unsigned)strtol(newval, &endptr, 0);
420    if (*endptr != '\0')
421    {
422       log_error(LOG_LEVEL_FATAL,
423          "Invalid delay-response{} parameter: '%s'", newval);
424    }
425
426    return delay;
427
428 }
429
430
431 /*********************************************************************
432  *
433  * Function    :  client_protocol_is_unsupported
434  *
435  * Description :  Checks if the client used a known unsupported
436  *                protocol and deals with it by sending an error
437  *                response.
438  *
439  * Parameters  :
440  *          1  :  csp = Current client state (buffers, headers, etc...)
441  *          2  :  req = the first request line send by the client
442  *
443  * Returns     :  TRUE if an error response has been generated, or
444  *                FALSE if the request doesn't look invalid.
445  *
446  *********************************************************************/
447 static int client_protocol_is_unsupported(struct client_state *csp, char *req)
448 {
449    /*
450     * If it's a FTP or gopher request, we don't support it.
451     *
452     * These checks are better than nothing, but they might
453     * not work in all configurations and some clients might
454     * have problems digesting the answer.
455     *
456     * They should, however, never cause more problems than
457     * Privoxy's old behaviour (returning the misleading HTML
458     * error message:
459     *
460     * "Could not resolve http://(ftp|gopher)://example.org").
461     */
462    if (!strncmpic(req, "GET ftp://", 10) || !strncmpic(req, "GET gopher://", 13))
463    {
464       const char *response = NULL;
465       const char *protocol = NULL;
466
467       if (!strncmpic(req, "GET ftp://", 10))
468       {
469          response = FTP_RESPONSE;
470          protocol = "FTP";
471       }
472       else
473       {
474          response = GOPHER_RESPONSE;
475          protocol = "GOPHER";
476       }
477       log_error(LOG_LEVEL_ERROR,
478          "%s tried to use Privoxy as %s proxy: %s",
479          csp->ip_addr_str, protocol, req);
480       log_error(LOG_LEVEL_CLF,
481          "%s - - [%T] \"%s\" 400 0", csp->ip_addr_str, req);
482       freez(req);
483
484 #ifdef FEATURE_HTTPS_INSPECTION
485       if (client_use_ssl(csp))
486       {
487          ssl_send_data_delayed(&(csp->ssl_client_attr),
488             (const unsigned char *)response, strlen(response),
489             get_write_delay(csp));
490       }
491       else
492 #endif
493       {
494          write_socket_delayed(csp->cfd, response, strlen(response),
495             get_write_delay(csp));
496       }
497
498       return TRUE;
499    }
500
501    return FALSE;
502 }
503
504
505 /*********************************************************************
506  *
507  * Function    :  client_has_unsupported_expectations
508  *
509  * Description :  Checks if the client used an unsupported expectation
510  *                in which case an error message is delivered.
511  *
512  * Parameters  :
513  *          1  :  csp = Current client state (buffers, headers, etc...)
514  *
515  * Returns     :  TRUE if an error response has been generated, or
516  *                FALSE if the request doesn't look invalid.
517  *
518  *********************************************************************/
519 static int client_has_unsupported_expectations(const struct client_state *csp)
520 {
521    if ((csp->flags & CSP_FLAG_UNSUPPORTED_CLIENT_EXPECTATION))
522    {
523       log_error(LOG_LEVEL_ERROR,
524          "Rejecting request from client %s with unsupported Expect header value",
525          csp->ip_addr_str);
526       log_error(LOG_LEVEL_CLF,
527          "%s - - [%T] \"%s\" 417 0", csp->ip_addr_str, csp->http->cmd);
528       write_socket_delayed(csp->cfd,
529          UNSUPPORTED_CLIENT_EXPECTATION_ERROR_RESPONSE,
530          strlen(UNSUPPORTED_CLIENT_EXPECTATION_ERROR_RESPONSE),
531          get_write_delay(csp));
532
533       return TRUE;
534    }
535
536    return FALSE;
537
538 }
539
540
541 /*********************************************************************
542  *
543  * Function    :  get_request_destination_elsewhere
544  *
545  * Description :  If the client's request was redirected into
546  *                Privoxy without the client's knowledge,
547  *                the request line lacks the destination host.
548  *
549  *                This function tries to get it elsewhere,
550  *                provided accept-intercepted-requests is enabled.
551  *
552  *                "Elsewhere" currently only means "Host: header",
553  *                but in the future we may ask the redirecting
554  *                packet filter to look the destination up.
555  *
556  *                If the destination stays unknown, an error
557  *                response is send to the client and headers
558  *                are freed so that chat() can return directly.
559  *
560  * Parameters  :
561  *          1  :  csp = Current client state (buffers, headers, etc...)
562  *          2  :  headers = a header list
563  *
564  * Returns     :  JB_ERR_OK if the destination is now known, or
565  *                JB_ERR_PARSE if it isn't.
566  *
567  *********************************************************************/
568 static jb_err get_request_destination_elsewhere(struct client_state *csp, struct list *headers)
569 {
570    if (!(csp->config->feature_flags & RUNTIME_FEATURE_ACCEPT_INTERCEPTED_REQUESTS))
571    {
572       log_error(LOG_LEVEL_ERROR, "%s's request: \'%s\' is invalid."
573          " Privoxy isn't configured to accept intercepted requests.",
574          csp->ip_addr_str, csp->http->cmd);
575       /* XXX: Use correct size */
576       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 400 0",
577          csp->ip_addr_str, csp->http->cmd);
578
579       write_socket_delayed(csp->cfd, CHEADER, strlen(CHEADER),
580          get_write_delay(csp));
581       destroy_list(headers);
582
583       return JB_ERR_PARSE;
584    }
585    else if (JB_ERR_OK == get_destination_from_headers(headers, csp->http))
586    {
587       /* Split the domain we just got for pattern matching */
588       init_domain_components(csp->http);
589
590       return JB_ERR_OK;
591    }
592    else
593    {
594       /* We can't work without destination. Go spread the news.*/
595
596       /* XXX: Use correct size */
597       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 400 0",
598          csp->ip_addr_str, csp->http->cmd);
599       log_error(LOG_LEVEL_ERROR,
600          "Privoxy was unable to get the destination for %s's request: %s",
601          csp->ip_addr_str, csp->http->cmd);
602
603       write_socket_delayed(csp->cfd, MISSING_DESTINATION_RESPONSE,
604          strlen(MISSING_DESTINATION_RESPONSE), get_write_delay(csp));
605       destroy_list(headers);
606
607       return JB_ERR_PARSE;
608    }
609    /*
610     * TODO: If available, use PF's ioctl DIOCNATLOOK as last resort
611     * to get the destination IP address, use it as host directly
612     * or do a reverse DNS lookup first.
613     */
614 }
615
616
617 /*********************************************************************
618  *
619  * Function    :  get_server_headers
620  *
621  * Description :  Parses server headers in iob and fills them
622  *                into csp->headers so that they can later be
623  *                handled by sed().
624  *
625  * Parameters  :
626  *          1  :  csp = Current client state (buffers, headers, etc...)
627  *
628  * Returns     :  JB_ERR_OK if everything went fine, or
629  *                JB_ERR_PARSE if the headers were incomplete.
630  *
631  *********************************************************************/
632 static jb_err get_server_headers(struct client_state *csp)
633 {
634    int continue_hack_in_da_house = 0;
635    char * header;
636
637    while (((header = get_header(csp->iob)) != NULL) || continue_hack_in_da_house)
638    {
639       if (header == NULL)
640       {
641          /*
642           * continue hack in da house. Ignore the ending of
643           * this head and continue enlisting header lines.
644           * The reason is described below.
645           */
646          enlist(csp->headers, "");
647          continue_hack_in_da_house = 0;
648          continue;
649       }
650       else if (0 == strncmpic(header, "HTTP/1.1 100", 12))
651       {
652          /*
653           * It's a bodyless continue response, don't
654           * stop header parsing after reaching its end.
655           *
656           * As a result Privoxy will concatenate the
657           * next response's head and parse and deliver
658           * the headers as if they belonged to one request.
659           *
660           * The client will separate them because of the
661           * empty line between them.
662           *
663           * XXX: What we're doing here is clearly against
664           * the intended purpose of the continue header,
665           * and under some conditions (HTTP/1.0 client request)
666           * it's a standard violation.
667           *
668           * Anyway, "sort of against the spec" is preferable
669           * to "always getting confused by Continue responses"
670           * (Privoxy's behaviour before this hack was added)
671           */
672          log_error(LOG_LEVEL_HEADER, "Continue hack in da house.");
673          continue_hack_in_da_house = 1;
674       }
675       else if (*header == '\0')
676       {
677          /*
678           * If the header is empty, but the Continue hack
679           * isn't active, we can assume that we reached the
680           * end of the buffer before we hit the end of the
681           * head.
682           *
683           * Inform the caller an let it decide how to handle it.
684           */
685          return JB_ERR_PARSE;
686       }
687
688       if (JB_ERR_MEMORY == enlist(csp->headers, header))
689       {
690          /*
691           * XXX: Should we quit the request and return a
692           * out of memory error page instead?
693           */
694          log_error(LOG_LEVEL_ERROR,
695             "Out of memory while enlisting server headers. %s lost.",
696             header);
697       }
698       freez(header);
699    }
700
701    return JB_ERR_OK;
702 }
703
704
705 /*********************************************************************
706  *
707  * Function    :  crunch_reason
708  *
709  * Description :  Translates the crunch reason code into a string.
710  *
711  * Parameters  :
712  *          1  :  rsp = a http_response
713  *
714  * Returns     :  A string with the crunch reason or an error description.
715  *
716  *********************************************************************/
717 static const char *crunch_reason(const struct http_response *rsp)
718 {
719    char * reason = NULL;
720
721    assert(rsp != NULL);
722    if (rsp == NULL)
723    {
724       return "Internal error while searching for crunch reason";
725    }
726
727    switch (rsp->crunch_reason)
728    {
729       case UNSUPPORTED:
730          reason = "Unsupported HTTP feature";
731          break;
732       case BLOCKED:
733          reason = "Blocked";
734          break;
735       case UNTRUSTED:
736          reason = "Untrusted";
737          break;
738       case REDIRECTED:
739          reason = "Redirected";
740          break;
741       case CGI_CALL:
742          reason = "CGI Call";
743          break;
744       case NO_SUCH_DOMAIN:
745          reason = "DNS failure";
746          break;
747       case FORWARDING_FAILED:
748          reason = "Forwarding failed";
749          break;
750       case CONNECT_FAILED:
751          reason = "Connection failure";
752          break;
753       case OUT_OF_MEMORY:
754          reason = "Out of memory (may mask other reasons)";
755          break;
756       case CONNECTION_TIMEOUT:
757          reason = "Connection timeout";
758          break;
759       case NO_SERVER_DATA:
760          reason = "No server data received";
761          break;
762       default:
763          reason = "No reason recorded";
764          break;
765    }
766
767    return reason;
768 }
769
770
771 /*********************************************************************
772  *
773  * Function    :  log_applied_actions
774  *
775  * Description :  Logs the applied actions if LOG_LEVEL_ACTIONS is
776  *                enabled.
777  *
778  * Parameters  :
779  *          1  :  actions = Current action spec to log
780  *
781  * Returns     :  Nothing.
782  *
783  *********************************************************************/
784 static void log_applied_actions(const struct current_action_spec *actions)
785 {
786    /*
787     * The conversion to text requires lots of memory allocations so
788     * we only do the conversion if the user is actually interested.
789     */
790    if (debug_level_is_enabled(LOG_LEVEL_ACTIONS))
791    {
792       char *actions_as_text = actions_to_line_of_text(actions);
793       log_error(LOG_LEVEL_ACTIONS, "%s", actions_as_text);
794       freez(actions_as_text);
795    }
796 }
797
798
799 /*********************************************************************
800  *
801  * Function    :  send_crunch_response
802  *
803  * Description :  Delivers already prepared response for
804  *                intercepted requests, logs the interception
805  *                and frees the response.
806  *
807  * Parameters  :
808  *          1  :  csp = Current client state (buffers, headers, etc...)
809  *          2  :  rsp = Fully prepared response. Will be freed on exit.
810  *
811  * Returns     :  Nothing.
812  *
813  *********************************************************************/
814 static void send_crunch_response(struct client_state *csp, struct http_response *rsp)
815 {
816       const struct http_request *http = csp->http;
817       char status_code[4];
818
819       assert(rsp != NULL);
820       assert(rsp->head != NULL);
821
822       if (rsp == NULL)
823       {
824          log_error(LOG_LEVEL_FATAL, "NULL response in send_crunch_response.");
825       }
826
827       /*
828        * Extract the status code from the actual head
829        * that will be send to the client. It is the only
830        * way to get it right for all requests, including
831        * the fixed ones for out-of-memory problems.
832        *
833        * A head starts like this: 'HTTP/1.1 200...'
834        *                           0123456789|11
835        *                                     10
836        */
837       status_code[0] = rsp->head[9];
838       status_code[1] = rsp->head[10];
839       status_code[2] = rsp->head[11];
840       status_code[3] = '\0';
841
842       /* Log that the request was crunched and why. */
843       log_applied_actions(csp->action);
844 #ifdef FEATURE_HTTPS_INSPECTION
845       if (client_use_ssl(csp))
846       {
847          log_error(LOG_LEVEL_CRUNCH, "%s: https://%s%s", crunch_reason(rsp),
848             http->hostport, http->path);
849          log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s https://%s%s %s\" %s %lu",
850             csp->ip_addr_str, http->gpc, http->hostport, http->path,
851             http->version, status_code, rsp->content_length);
852       }
853       else
854 #endif
855       {
856          log_error(LOG_LEVEL_CRUNCH, "%s: %s", crunch_reason(rsp), http->url);
857          log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" %s %lu",
858             csp->ip_addr_str, http->ocmd, status_code, rsp->content_length);
859       }
860       /* Write the answer to the client */
861 #ifdef FEATURE_HTTPS_INSPECTION
862       if (client_use_ssl(csp))
863       {
864          if ((ssl_send_data_delayed(&(csp->ssl_client_attr),
865                 (const unsigned char *)rsp->head, rsp->head_length,
866                 get_write_delay(csp)) < 0)
867           || (ssl_send_data_delayed(&(csp->ssl_client_attr),
868                 (const unsigned char *)rsp->body, rsp->content_length,
869                 get_write_delay(csp)) < 0))
870          {
871             /* There is nothing we can do about it. */
872             log_error(LOG_LEVEL_CONNECT, "Couldn't deliver the error message "
873                "for https://%s%s through client socket %d using TLS/SSL",
874                http->hostport, http->url, csp->cfd);
875          }
876       }
877       else
878 #endif
879       {
880          if (write_socket_delayed(csp->cfd, rsp->head, rsp->head_length,
881                 get_write_delay(csp))
882           || write_socket_delayed(csp->cfd, rsp->body, rsp->content_length,
883                 get_write_delay(csp)))
884          {
885             /* There is nothing we can do about it. */
886             log_error(LOG_LEVEL_CONNECT,
887                "Couldn't deliver the error message for %s through client socket %d: %E",
888                http->url, csp->cfd);
889          }
890       }
891
892       /* Clean up and return */
893       if (cgi_error_memory() != rsp)
894       {
895          free_http_response(rsp);
896       }
897       return;
898 }
899
900
901 /*********************************************************************
902  *
903  * Function    :  crunch_response_triggered
904  *
905  * Description :  Checks if the request has to be crunched,
906  *                and delivers the crunch response if necessary.
907  *
908  * Parameters  :
909  *          1  :  csp = Current client state (buffers, headers, etc...)
910  *          2  :  crunchers = list of cruncher functions to run
911  *
912  * Returns     :  TRUE if the request was answered with a crunch response
913  *                FALSE otherwise.
914  *
915  *********************************************************************/
916 static int crunch_response_triggered(struct client_state *csp, const struct cruncher crunchers[])
917 {
918    struct http_response *rsp = NULL;
919    const struct cruncher *c;
920
921    /*
922     * If CGI request crunching is disabled,
923     * check the CGI dispatcher out of order to
924     * prevent unintentional blocks or redirects.
925     */
926    if (!(csp->config->feature_flags & RUNTIME_FEATURE_CGI_CRUNCHING)
927        && (NULL != (rsp = dispatch_cgi(csp))))
928    {
929       /* Deliver, log and free the interception response. */
930       send_crunch_response(csp, rsp);
931       csp->flags |= CSP_FLAG_CRUNCHED;
932       return TRUE;
933    }
934
935    for (c = crunchers; c->cruncher != NULL; c++)
936    {
937       /*
938        * Check the cruncher if either Privoxy is toggled
939        * on and the request isn't forced, or if the cruncher
940        * applies to forced requests as well.
941        */
942       if (((csp->flags & CSP_FLAG_TOGGLED_ON) &&
943           !(csp->flags & CSP_FLAG_FORCED)) ||
944           (c->flags & CF_IGNORE_FORCE))
945       {
946          rsp = c->cruncher(csp);
947          if (NULL != rsp)
948          {
949             /* Deliver, log and free the interception response. */
950             send_crunch_response(csp, rsp);
951             csp->flags |= CSP_FLAG_CRUNCHED;
952 #ifdef FEATURE_STATISTICS
953             if (c->flags & CF_COUNT_AS_REJECT)
954             {
955 #ifdef MUTEX_LOCKS_AVAILABLE
956                privoxy_mutex_lock(&block_statistics_mutex);
957                number_of_requests_blocked++;
958                privoxy_mutex_unlock(&block_statistics_mutex);
959 #endif
960                csp->flags |= CSP_FLAG_REJECTED;
961             }
962 #endif /* def FEATURE_STATISTICS */
963
964             return TRUE;
965          }
966       }
967    }
968
969    return FALSE;
970 }
971
972
973 /*********************************************************************
974  *
975  * Function    :  build_request_line
976  *
977  * Description :  Builds the HTTP request line.
978  *
979  *                If a HTTP forwarder is used it expects the whole URL,
980  *                web servers only get the path.
981  *
982  * Parameters  :
983  *          1  :  csp = Current client state (buffers, headers, etc...)
984  *          2  :  fwd = The forwarding spec used for the request.
985  *                      Can be NULL.
986  *          3  :  request_line = The old request line which will be replaced.
987  *
988  * Returns     :  Nothing. Terminates in case of memory problems.
989  *
990  *********************************************************************/
991 static void build_request_line(struct client_state *csp, const struct forward_spec *fwd, char **request_line)
992 {
993    struct http_request *http = csp->http;
994
995    /*
996     * Downgrade http version from 1.1 to 1.0
997     * if +downgrade action applies.
998     */
999    if ((csp->action->flags & ACTION_DOWNGRADE)
1000      && (!strcmpic(http->version, "HTTP/1.1")))
1001    {
1002       freez(http->version);
1003       http->version = strdup_or_die("HTTP/1.0");
1004    }
1005
1006    /*
1007     * Rebuild the request line.
1008     */
1009    freez(*request_line);
1010 #ifdef FEATURE_HTTPS_INSPECTION
1011    if (fwd != NULL && fwd->forward_host &&
1012        fwd->type != FORWARD_WEBSERVER && client_use_ssl(csp))
1013    {
1014       *request_line = strdup("CONNECT ");
1015    }
1016    else
1017 #endif
1018    {
1019       *request_line = strdup(http->gpc);
1020       string_append(request_line, " ");
1021    }
1022
1023    if (fwd != NULL && fwd->forward_host && fwd->type != FORWARD_WEBSERVER)
1024    {
1025 #ifdef FEATURE_HTTPS_INSPECTION
1026       if (client_use_ssl(csp))
1027       {
1028          char port_string[10];
1029
1030          string_append(request_line, http->host);
1031          snprintf(port_string, sizeof(port_string), ":%d", http->port);
1032          string_append(request_line, port_string);
1033       }
1034       else
1035 #endif
1036       {
1037          string_append(request_line, http->url);
1038       }
1039    }
1040    else
1041    {
1042       string_append(request_line, http->path);
1043    }
1044    string_append(request_line, " ");
1045    string_append(request_line, http->version);
1046
1047    if (*request_line == NULL)
1048    {
1049       log_error(LOG_LEVEL_FATAL, "Out of memory writing HTTP command");
1050    }
1051    log_error(LOG_LEVEL_HEADER, "New HTTP Request-Line: %s", *request_line);
1052 }
1053
1054
1055 /*********************************************************************
1056  *
1057  * Function    :  change_request_destination
1058  *
1059  * Description :  Parse a (rewritten) request line and regenerate
1060  *                the http request data.
1061  *
1062  * Parameters  :
1063  *          1  :  csp = Current client state (buffers, headers, etc...)
1064  *
1065  * Returns     :  Forwards the parse_http_request() return code.
1066  *                Terminates in case of memory problems.
1067  *
1068  *********************************************************************/
1069 static jb_err change_request_destination(struct client_state *csp)
1070 {
1071    struct http_request *http = csp->http;
1072    jb_err err;
1073
1074    log_error(LOG_LEVEL_REDIRECTS, "Rewrite detected: %s",
1075       csp->headers->first->str);
1076    free_http_request(http);
1077    err = parse_http_request(csp->headers->first->str, http);
1078    if (JB_ERR_OK != err)
1079    {
1080       log_error(LOG_LEVEL_ERROR, "Couldn't parse rewritten request: %s.",
1081          jb_err_to_string(err));
1082    }
1083    if (http->ssl && strcmpic(csp->http->gpc, "CONNECT"))
1084    {
1085       /*
1086        * A client header filter changed the request URL from
1087        * http:// to https:// which we currently don't support.
1088        */
1089       log_error(LOG_LEVEL_ERROR, "Changing the request destination from http "
1090          "to https behind the client's back currently isn't supported.");
1091       return JB_ERR_PARSE;
1092    }
1093
1094    return err;
1095 }
1096
1097
1098 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
1099 /*********************************************************************
1100  *
1101  * Function    :  server_response_is_complete
1102  *
1103  * Description :  Determines whether we should stop reading
1104  *                from the server socket.
1105  *
1106  * Parameters  :
1107  *          1  :  csp = Current client state (buffers, headers, etc...)
1108  *          2  :  content_length = Length of content received so far.
1109  *
1110  * Returns     :  TRUE if the response is complete,
1111  *                FALSE otherwise.
1112  *
1113  *********************************************************************/
1114 static int server_response_is_complete(struct client_state *csp,
1115    unsigned long long content_length)
1116 {
1117    int content_length_known = !!(csp->flags & CSP_FLAG_CONTENT_LENGTH_SET);
1118
1119    if (!strcmpic(csp->http->gpc, "HEAD"))
1120    {
1121       /*
1122        * "HEAD" implies no body, we are thus expecting
1123        * no content. XXX: incomplete "list" of methods?
1124        */
1125       csp->expected_content_length = 0;
1126       content_length_known = TRUE;
1127       csp->flags |= CSP_FLAG_SERVER_CONTENT_LENGTH_SET;
1128    }
1129
1130    if (csp->http->status == 204 || csp->http->status == 304)
1131    {
1132       /*
1133        * Expect no body. XXX: incomplete "list" of status codes?
1134        */
1135       csp->expected_content_length = 0;
1136       content_length_known = TRUE;
1137       csp->flags |= CSP_FLAG_SERVER_CONTENT_LENGTH_SET;
1138    }
1139
1140    return (content_length_known && ((0 == csp->expected_content_length)
1141             || (csp->expected_content_length <= content_length)));
1142 }
1143
1144
1145 #ifdef FEATURE_CONNECTION_SHARING
1146 /*********************************************************************
1147  *
1148  * Function    :  wait_for_alive_connections
1149  *
1150  * Description :  Waits for alive connections to timeout.
1151  *
1152  * Parameters  :  N/A
1153  *
1154  * Returns     :  N/A
1155  *
1156  *********************************************************************/
1157 static void wait_for_alive_connections(void)
1158 {
1159    int connections_alive = close_unusable_connections();
1160
1161    while (0 < connections_alive)
1162    {
1163       log_error(LOG_LEVEL_CONNECT,
1164          "Waiting for %d connections to timeout.",
1165          connections_alive);
1166       sleep(60);
1167       connections_alive = close_unusable_connections();
1168    }
1169
1170    log_error(LOG_LEVEL_CONNECT, "No connections to wait for left.");
1171
1172 }
1173 #endif /* def FEATURE_CONNECTION_SHARING */
1174
1175
1176 /*********************************************************************
1177  *
1178  * Function    :  save_connection_destination
1179  *
1180  * Description :  Remembers a connection for reuse later on.
1181  *
1182  * Parameters  :
1183  *          1  :  sfd  = Open socket to remember.
1184  *          2  :  http = The destination for the connection.
1185  *          3  :  fwd  = The forwarder settings used.
1186  *          4  :  server_connection  = storage.
1187  *
1188  * Returns     : void
1189  *
1190  *********************************************************************/
1191 static void save_connection_destination(jb_socket sfd,
1192                                         const struct http_request *http,
1193                                         const struct forward_spec *fwd,
1194                                         struct reusable_connection *server_connection)
1195 {
1196    assert(sfd != JB_INVALID_SOCKET);
1197    assert(NULL != http->host);
1198
1199    server_connection->sfd = sfd;
1200    server_connection->host = strdup_or_die(http->host);
1201    server_connection->port = http->port;
1202
1203    assert(NULL != fwd);
1204    assert(server_connection->gateway_host == NULL);
1205    assert(server_connection->gateway_port == 0);
1206    assert(server_connection->forwarder_type == 0);
1207    assert(server_connection->forward_host == NULL);
1208    assert(server_connection->forward_port == 0);
1209
1210    server_connection->forwarder_type = fwd->type;
1211    if (NULL != fwd->gateway_host)
1212    {
1213       server_connection->gateway_host = strdup_or_die(fwd->gateway_host);
1214    }
1215    else
1216    {
1217       server_connection->gateway_host = NULL;
1218    }
1219    server_connection->gateway_port = fwd->gateway_port;
1220    if (NULL != fwd->auth_username)
1221    {
1222       server_connection->auth_username = strdup_or_die(fwd->auth_username);
1223    }
1224    else
1225    {
1226       server_connection->auth_username = NULL;
1227    }
1228    if (NULL != fwd->auth_password)
1229    {
1230       server_connection->auth_password = strdup_or_die(fwd->auth_password);
1231    }
1232    else
1233    {
1234       server_connection->auth_password = NULL;
1235    }
1236
1237    if (NULL != fwd->forward_host)
1238    {
1239       server_connection->forward_host = strdup_or_die(fwd->forward_host);
1240    }
1241    else
1242    {
1243       server_connection->forward_host = NULL;
1244    }
1245    server_connection->forward_port = fwd->forward_port;
1246 }
1247 #endif /* FEATURE_CONNECTION_KEEP_ALIVE */
1248
1249
1250 /*********************************************************************
1251  *
1252  * Function    : verify_request_length
1253  *
1254  * Description : Checks if we already got the whole client requests
1255  *               and sets CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ if
1256  *               we do.
1257  *
1258  *               Data that doesn't belong to the current request is
1259  *               either thrown away to let the client retry on a clean
1260  *               socket, or stashed to be dealt with after the current
1261  *               request is served.
1262  *
1263  * Parameters  :
1264  *          1  :  csp = Current client state (buffers, headers, etc...)
1265  *
1266  * Returns     :  void
1267  *
1268  *********************************************************************/
1269 static void verify_request_length(struct client_state *csp)
1270 {
1271    unsigned long long buffered_request_bytes =
1272       (unsigned long long)(csp->client_iob->eod - csp->client_iob->cur);
1273
1274    if ((csp->expected_client_content_length != 0)
1275       && (buffered_request_bytes != 0))
1276    {
1277       if (csp->expected_client_content_length >= buffered_request_bytes)
1278       {
1279          csp->expected_client_content_length -= buffered_request_bytes;
1280          log_error(LOG_LEVEL_CONNECT, "Reduced expected bytes to %llu "
1281             "to account for the %llu ones we already got.",
1282             csp->expected_client_content_length, buffered_request_bytes);
1283       }
1284       else
1285       {
1286          assert(csp->client_iob->eod > csp->client_iob->cur + csp->expected_client_content_length);
1287          csp->client_iob->eod = csp->client_iob->cur + csp->expected_client_content_length;
1288          log_error(LOG_LEVEL_CONNECT, "Reducing expected bytes to 0. "
1289             "Marking the server socket tainted after throwing %llu bytes away.",
1290             buffered_request_bytes - csp->expected_client_content_length);
1291          csp->expected_client_content_length = 0;
1292          csp->flags |= CSP_FLAG_SERVER_SOCKET_TAINTED;
1293       }
1294
1295       if (csp->expected_client_content_length == 0)
1296       {
1297          csp->flags |= CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
1298       }
1299    }
1300
1301    if (!(csp->flags & CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ)
1302       && ((csp->client_iob->cur < csp->client_iob->eod)
1303          || (csp->expected_client_content_length != 0)))
1304    {
1305       if (strcmpic(csp->http->gpc, "GET")
1306          && strcmpic(csp->http->gpc, "HEAD")
1307          && strcmpic(csp->http->gpc, "TRACE")
1308          && strcmpic(csp->http->gpc, "OPTIONS")
1309          && strcmpic(csp->http->gpc, "DELETE"))
1310       {
1311          /* XXX: this is an incomplete hack */
1312          csp->flags &= ~CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
1313          log_error(LOG_LEVEL_CONNECT, "There better be a request body.");
1314       }
1315       else
1316       {
1317          csp->flags |= CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
1318
1319          if ((csp->config->feature_flags & RUNTIME_FEATURE_TOLERATE_PIPELINING) == 0)
1320          {
1321             csp->flags |= CSP_FLAG_SERVER_SOCKET_TAINTED;
1322             log_error(LOG_LEVEL_CONNECT,
1323                "Possible pipeline attempt detected. The connection will not "
1324                "be kept alive and we will only serve the first request.");
1325             /* Nuke the pipelined requests from orbit, just to be sure. */
1326             clear_iob(csp->client_iob);
1327          }
1328          else
1329          {
1330             /*
1331              * Keep the pipelined data around for now, we'll deal with
1332              * it once we're done serving the current request.
1333              */
1334             csp->flags |= CSP_FLAG_PIPELINED_REQUEST_WAITING;
1335             assert(csp->client_iob->eod >= csp->client_iob->cur);
1336             log_error(LOG_LEVEL_CONNECT, "Complete client request followed by "
1337                "%d bytes of pipelined data received.",
1338                (int)(csp->client_iob->eod - csp->client_iob->cur));
1339          }
1340       }
1341    }
1342    else
1343    {
1344       csp->flags |= CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
1345       log_error(LOG_LEVEL_CONNECT, "Complete client request received.");
1346    }
1347 }
1348
1349
1350 /*********************************************************************
1351  *
1352  * Function    :  mark_server_socket_tainted
1353  *
1354  * Description :  Makes sure we don't reuse a server socket
1355  *                (if we didn't read everything the server sent
1356  *                us reusing the socket would lead to garbage).
1357  *
1358  * Parameters  :
1359  *          1  :  csp = Current client state (buffers, headers, etc...)
1360  *
1361  * Returns     :  void.
1362  *
1363  *********************************************************************/
1364 static void mark_server_socket_tainted(struct client_state *csp)
1365 {
1366    /*
1367     * For consistency we always mark the server socket
1368     * tainted, however, to reduce the log noise we only
1369     * emit a log message if the server socket could have
1370     * actually been reused.
1371     */
1372    if ((csp->flags & CSP_FLAG_SERVER_CONNECTION_KEEP_ALIVE)
1373       && !(csp->flags & CSP_FLAG_SERVER_SOCKET_TAINTED))
1374    {
1375       log_error(LOG_LEVEL_CONNECT,
1376          "Marking the server socket %d tainted.",
1377          csp->server_connection.sfd);
1378    }
1379    csp->flags |= CSP_FLAG_SERVER_SOCKET_TAINTED;
1380 }
1381
1382 /*********************************************************************
1383  *
1384  * Function    :  get_request_line
1385  *
1386  * Description : Read the client request line.
1387  *
1388  * Parameters  :
1389  *          1  :  csp = Current client state (buffers, headers, etc...)
1390  *
1391  * Returns     :  Pointer to request line or NULL in case of errors.
1392  *
1393  *********************************************************************/
1394 static char *get_request_line(struct client_state *csp)
1395 {
1396    char buf[BUFFER_SIZE];
1397    char *request_line = NULL;
1398    int len;
1399
1400    memset(buf, 0, sizeof(buf));
1401
1402    if ((csp->flags & CSP_FLAG_PIPELINED_REQUEST_WAITING) != 0)
1403    {
1404       /*
1405        * If there are multiple pipelined requests waiting,
1406        * the flag will be set again once the next request
1407        * has been parsed.
1408        */
1409       csp->flags &= ~CSP_FLAG_PIPELINED_REQUEST_WAITING;
1410
1411       request_line = get_header(csp->client_iob);
1412       if ((NULL != request_line) && ('\0' != *request_line))
1413       {
1414          return request_line;
1415       }
1416       else
1417       {
1418          log_error(LOG_LEVEL_CONNECT, "No complete request line "
1419             "received yet. Continuing reading from %d.", csp->cfd);
1420       }
1421    }
1422
1423    do
1424    {
1425       if (
1426 #ifdef FUZZ
1427           0 == (csp->flags & CSP_FLAG_FUZZED_INPUT) &&
1428 #endif
1429           !data_is_available(csp->cfd, csp->config->socket_timeout)
1430           )
1431       {
1432          if (socket_is_still_alive(csp->cfd))
1433          {
1434             log_error(LOG_LEVEL_CONNECT,
1435                "No request line on socket %d received in time. Timeout: %d.",
1436                csp->cfd, csp->config->socket_timeout);
1437             write_socket_delayed(csp->cfd, CLIENT_CONNECTION_TIMEOUT_RESPONSE,
1438                strlen(CLIENT_CONNECTION_TIMEOUT_RESPONSE),
1439                get_write_delay(csp));
1440          }
1441          else
1442          {
1443             log_error(LOG_LEVEL_CONNECT,
1444                "The client side of the connection on socket %d got "
1445                "closed without sending a complete request line.", csp->cfd);
1446          }
1447          return NULL;
1448       }
1449
1450       len = read_socket(csp->cfd, buf, sizeof(buf) - 1);
1451
1452       if (len <= 0) return NULL;
1453
1454       /*
1455        * If there is no memory left for buffering the
1456        * request, there is nothing we can do but hang up
1457        */
1458       if (add_to_iob(csp->client_iob, csp->config->buffer_limit, buf, len))
1459       {
1460          return NULL;
1461       }
1462
1463       request_line = get_header(csp->client_iob);
1464
1465    } while ((NULL != request_line) && ('\0' == *request_line));
1466
1467    return request_line;
1468
1469 }
1470
/* Result of checking a buffered chunk-encoded body for completeness. */
enum chunk_status
{
   /* The buffer ends before the body does, more data is needed. */
   CHUNK_STATUS_MISSING_DATA  = 0,
   /* All chunks including the last one are in the buffer. */
   CHUNK_STATUS_BODY_COMPLETE = 1,
   /* The buffered data isn't valid chunked encoding. */
   CHUNK_STATUS_PARSE_ERROR   = 2
};
1477
1478
1479 /*********************************************************************
1480  *
1481  * Function    :  chunked_body_is_complete
1482  *
1483  * Description :  Figures out whether or not a chunked body is complete.
1484  *
1485  *                Currently it always starts at the beginning of the
1486  *                buffer which is somewhat wasteful and prevents Privoxy
1487  *                from starting to forward the correctly parsed chunks
1488  *                as soon as theoretically possible.
1489  *
1490  *                Should be modified to work with a common buffer,
1491  *                and allow the caller to skip already parsed chunks.
1492  *
1493  *                This would allow the function to be used for unbuffered
1494  *                response bodies as well.
1495  *
1496  * Parameters  :
1497  *          1  :  iob = Buffer with the body to check.
1498  *          2  :  length = Length of complete body
1499  *
1500  * Returns     :  Enum with the result of the check.
1501  *
1502  *********************************************************************/
1503 static enum chunk_status chunked_body_is_complete(struct iob *iob, size_t *length)
1504 {
1505    unsigned int chunksize;
1506    char *p = iob->cur;
1507
1508    do
1509    {
1510       /*
1511        * We need at least a single digit, followed by "\r\n",
1512        * followed by an unknown amount of data, followed by "\r\n".
1513        */
1514       if (p + 5 > iob->eod)
1515       {
1516          return CHUNK_STATUS_MISSING_DATA;
1517       }
1518       if (sscanf(p, "%x", &chunksize) != 1)
1519       {
1520          return CHUNK_STATUS_PARSE_ERROR;
1521       }
1522
1523       /*
1524        * We want at least a single digit, followed by "\r\n",
1525        * followed by the specified amount of data, followed by "\r\n".
1526        */
1527       if (p + chunksize + 5 > iob->eod)
1528       {
1529          return CHUNK_STATUS_MISSING_DATA;
1530       }
1531
1532       /* Skip chunk-size. */
1533       p = strstr(p, "\r\n");
1534       if (NULL == p)
1535       {
1536          return CHUNK_STATUS_PARSE_ERROR;
1537       }
1538       /* Move beyond the chunkdata. */
1539       p += 2 + chunksize;
1540
1541       /* Make sure we're still within the buffer and have two bytes left */
1542       if (p + 2 > iob->eod)
1543       {
1544          return CHUNK_STATUS_MISSING_DATA;
1545       }
1546
1547       /* There should be another "\r\n" to skip */
1548       if (memcmp(p, "\r\n", 2))
1549       {
1550          return CHUNK_STATUS_PARSE_ERROR;
1551       }
1552       p += 2;
1553    } while (chunksize > 0U);
1554
1555    *length = (size_t)(p - iob->cur);
1556    assert(*length <= (size_t)(iob->eod - iob->cur));
1557    assert(p <= iob->eod);
1558
1559    return CHUNK_STATUS_BODY_COMPLETE;
1560
1561 }
1562
1563
1564 /*********************************************************************
1565  *
1566  * Function    : receive_chunked_client_request_body
1567  *
1568  * Description : Read the chunk-encoded client request body.
1569  *               Failures are dealt with.
1570  *
1571  * Parameters  :
1572  *          1  :  csp = Current client state (buffers, headers, etc...)
1573  *
1574  * Returns     :  JB_ERR_OK or JB_ERR_PARSE
1575  *
1576  *********************************************************************/
1577 static jb_err receive_chunked_client_request_body(struct client_state *csp)
1578 {
1579    size_t body_length;
1580    enum chunk_status status;
1581
1582    while (CHUNK_STATUS_MISSING_DATA ==
1583       (status = chunked_body_is_complete(csp->client_iob, &body_length)))
1584    {
1585       char buf[BUFFER_SIZE];
1586       int len;
1587
1588       if (!data_is_available(csp->cfd, csp->config->socket_timeout))
1589       {
1590          log_error(LOG_LEVEL_ERROR,
1591             "Timeout while waiting for the client body.");
1592          break;
1593       }
1594       len = read_socket(csp->cfd, buf, sizeof(buf) - 1);
1595       if (len <= 0)
1596       {
1597          log_error(LOG_LEVEL_ERROR,
1598             "Reading the client body failed: %E");
1599          break;
1600       }
1601       if (add_to_iob(csp->client_iob, csp->config->buffer_limit, buf, len))
1602       {
1603          break;
1604       }
1605    }
1606    if (status != CHUNK_STATUS_BODY_COMPLETE)
1607    {
1608       write_socket_delayed(csp->cfd, CLIENT_BODY_PARSE_ERROR_RESPONSE,
1609          strlen(CLIENT_BODY_PARSE_ERROR_RESPONSE), get_write_delay(csp));
1610       log_error(LOG_LEVEL_CLF,
1611          "%s - - [%T] \"Failed reading chunked client body\" 400 0", csp->ip_addr_str);
1612       return JB_ERR_PARSE;
1613    }
1614    log_error(LOG_LEVEL_CONNECT,
1615       "Chunked client body completely read. Length: %lu", body_length);
1616    csp->expected_client_content_length = body_length;
1617
1618    return JB_ERR_OK;
1619
1620 }
1621
1622
1623 #ifdef FUZZ
1624 /*********************************************************************
1625  *
1626  * Function    :  fuzz_chunked_transfer_encoding
1627  *
1628  * Description :  Treat the fuzzed input as chunked transfer encoding
1629  *                to check and dechunk.
1630  *
1631  * Parameters  :
1632  *          1  :  csp      = Used to store the data.
1633  *          2  :  fuzz_input_file = File to read the input from.
1634  *
1635  * Returns     : Result of dechunking
1636  *
1637  *********************************************************************/
1638 extern int fuzz_chunked_transfer_encoding(struct client_state *csp, char *fuzz_input_file)
1639 {
1640    size_t length;
1641    size_t size = (size_t)(csp->iob->eod - csp->iob->cur);
1642    enum chunk_status status;
1643
1644    status = chunked_body_is_complete(csp->iob, &length);
1645    if (CHUNK_STATUS_BODY_COMPLETE != status)
1646    {
1647       log_error(LOG_LEVEL_INFO, "Chunked body is incomplete or invalid");
1648    }
1649
1650    return (JB_ERR_OK == remove_chunked_transfer_coding(csp->iob->cur, &size));
1651
1652 }
1653
1654
1655 /*********************************************************************
1656  *
1657  * Function    : fuzz_client_request
1658  *
1659  * Description : Try to get a client request from the fuzzed input.
1660  *
1661  * Parameters  :
1662  *          1  :  csp = Current client state (buffers, headers, etc...)
1663  *          2  :  fuzz_input_file = File to read the input from.
1664  *
1665  * Returns     :  Result of fuzzing.
1666  *
1667  *********************************************************************/
1668 extern int fuzz_client_request(struct client_state *csp, char *fuzz_input_file)
1669 {
1670    jb_err err;
1671
1672    csp->cfd = 0;
1673    csp->ip_addr_str = "fuzzer";
1674
1675    if (strcmp(fuzz_input_file, "-") != 0)
1676    {
1677       log_error(LOG_LEVEL_FATAL,
1678          "Fuzzed client requests can currently only be read from stdin (-).");
1679    }
1680    err = receive_client_request(csp);
1681    if (err != JB_ERR_OK)
1682    {
1683       return 1;
1684    }
1685    err = parse_client_request(csp);
1686    if (err != JB_ERR_OK)
1687    {
1688       return 1;
1689    }
1690
1691    return 0;
1692
1693 }
1694 #endif  /* def FUZZ */
1695
1696
1697 #ifdef FEATURE_FORCE_LOAD
1698 /*********************************************************************
1699  *
1700  * Function    :  force_required
1701  *
1702  * Description : Checks a request line to see if it contains
1703  *               the FORCE_PREFIX. If it does, it is removed
1704  *               unless enforcing requests has beend disabled.
1705  *
1706  * Parameters  :
1707  *          1  :  request_line = HTTP request line
1708  *
1709  * Returns     :  TRUE if force is required, FALSE otherwise.
1710  *
1711  *********************************************************************/
1712 static int force_required(const struct client_state *csp, char *request_line)
1713 {
1714    char *p;
1715
1716    p = strstr(request_line, "http://");
1717    if (p != NULL)
1718    {
1719       /* Skip protocol */
1720       p += strlen("http://");
1721    }
1722    else
1723    {
1724       /* Intercepted request usually don't specify the protocol. */
1725       p = request_line;
1726    }
1727
1728    /* Go to the beginning of the path */
1729    p = strstr(p, "/");
1730    if (p == NULL)
1731    {
1732       /*
1733        * If the path is missing the request line is invalid and we
1734        * are done here. The client-visible rejection happens later on.
1735        */
1736       return 0;
1737    }
1738
1739    if (0 == strncmpic(p, FORCE_PREFIX, strlen(FORCE_PREFIX) - 1))
1740    {
1741       if (!(csp->config->feature_flags & RUNTIME_FEATURE_ENFORCE_BLOCKS))
1742       {
1743          /* XXX: Should clean more carefully */
1744          strclean(request_line, FORCE_PREFIX);
1745          log_error(LOG_LEVEL_FORCE,
1746             "Enforcing request: \"%s\".", request_line);
1747
1748          return 1;
1749       }
1750       log_error(LOG_LEVEL_FORCE,
1751          "Ignored force prefix in request: \"%s\".", request_line);
1752    }
1753
1754    return 0;
1755
1756 }
1757 #endif /* def FEATURE_FORCE_LOAD */
1758
1759
1760 /*********************************************************************
1761  *
1762  * Function    :  receive_client_request
1763  *
1764  * Description : Read the client's request (more precisely the
1765  *               client headers) and answer it if necessary.
1766  *
1767  * Parameters  :
1768  *          1  :  csp = Current client state (buffers, headers, etc...)
1769  *
1770  * Returns     :  JB_ERR_OK, JB_ERR_PARSE or JB_ERR_MEMORY
1771  *
1772  *********************************************************************/
1773 static jb_err receive_client_request(struct client_state *csp)
1774 {
1775    char buf[BUFFER_SIZE];
1776    char *p;
1777    char *req = NULL;
1778    struct http_request *http;
1779    int len;
1780    jb_err err;
1781
1782    /* Temporary copy of the client's headers before they get enlisted in csp->headers */
1783    struct list header_list;
1784    struct list *headers = &header_list;
1785
1786    /* We don't care if the arriving data is a valid HTTP request or not. */
1787    csp->requests_received_total++;
1788
1789    http = csp->http;
1790
1791    memset(buf, 0, sizeof(buf));
1792
1793    req = get_request_line(csp);
1794    if (req == NULL)
1795    {
1796       mark_server_socket_tainted(csp);
1797       return JB_ERR_PARSE;
1798    }
1799    assert(*req != '\0');
1800
1801    if (client_protocol_is_unsupported(csp, req))
1802    {
1803       return JB_ERR_PARSE;
1804    }
1805
1806 #ifdef FEATURE_FORCE_LOAD
1807    if (force_required(csp, req))
1808    {
1809       csp->flags |= CSP_FLAG_FORCED;
1810    }
1811 #endif /* def FEATURE_FORCE_LOAD */
1812
1813    err = parse_http_request(req, http);
1814    freez(req);
1815    if (JB_ERR_OK != err)
1816    {
1817       write_socket_delayed(csp->cfd, CHEADER, strlen(CHEADER),
1818          get_write_delay(csp));
1819       /* XXX: Use correct size */
1820       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"Invalid request\" 400 0", csp->ip_addr_str);
1821       log_error(LOG_LEVEL_ERROR,
1822          "Couldn't parse request line received from %s: %s",
1823          csp->ip_addr_str, jb_err_to_string(err));
1824
1825       free_http_request(http);
1826       return JB_ERR_PARSE;
1827    }
1828    if (http->ssl && strcmpic(http->gpc, "CONNECT"))
1829    {
1830       write_socket_delayed(csp->cfd, CHEADER, strlen(CHEADER),
1831          get_write_delay(csp));
1832       /* XXX: Use correct size */
1833       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"Invalid request\" 400 0",
1834          csp->ip_addr_str);
1835       log_error(LOG_LEVEL_ERROR, "Client %s tried to send a https "
1836          "URL without sending a CONNECT request first",
1837          csp->ip_addr_str);
1838       free_http_request(http);
1839       return JB_ERR_PARSE;
1840    }
1841
1842    /* grab the rest of the client's headers */
1843    init_list(headers);
1844    for (;;)
1845    {
1846       p = get_header(csp->client_iob);
1847
1848       if (p == NULL)
1849       {
1850          /* There are no additional headers to read. */
1851          break;
1852       }
1853
1854       if (*p == '\0')
1855       {
1856          /*
1857           * We didn't receive a complete header
1858           * line yet, get the rest of it.
1859           */
1860          if (!data_is_available(csp->cfd, csp->config->socket_timeout))
1861          {
1862             log_error(LOG_LEVEL_ERROR,
1863                "Client headers did not arrive in time. Timeout: %d",
1864                csp->config->socket_timeout);
1865             destroy_list(headers);
1866             return JB_ERR_PARSE;
1867          }
1868
1869          len = read_socket(csp->cfd, buf, sizeof(buf) - 1);
1870          if (len <= 0)
1871          {
1872             log_error(LOG_LEVEL_ERROR, "read from client failed: %E");
1873             destroy_list(headers);
1874             return JB_ERR_PARSE;
1875          }
1876
1877          if (add_to_iob(csp->client_iob, csp->config->buffer_limit, buf, len))
1878          {
1879             /*
1880              * If there is no memory left for buffering the
1881              * request, there is nothing we can do but hang up
1882              */
1883             destroy_list(headers);
1884             return JB_ERR_MEMORY;
1885          }
1886       }
1887       else
1888       {
1889          if (!strncmpic(p, "Transfer-Encoding:", 18))
1890          {
1891             /*
1892              * XXX: should be called through sed()
1893              *      but currently can't.
1894              */
1895             client_transfer_encoding(csp, &p);
1896          }
1897          /*
1898           * We were able to read a complete
1899           * header and can finally enlist it.
1900           */
1901          enlist(headers, p);
1902          freez(p);
1903       }
1904    }
1905
1906    if (http->host == NULL)
1907    {
1908       /*
1909        * If we still don't know the request destination,
1910        * the request is invalid or the client uses
1911        * Privoxy without its knowledge.
1912        */
1913       if (JB_ERR_OK != get_request_destination_elsewhere(csp, headers))
1914       {
1915          /*
1916           * Our attempts to get the request destination
1917           * elsewhere failed or Privoxy is configured
1918           * to only accept proxy requests.
1919           *
1920           * An error response has already been sent
1921           * and we're done here.
1922           */
1923          return JB_ERR_PARSE;
1924       }
1925    }
1926
1927 #ifdef FEATURE_CLIENT_TAGS
1928    /* XXX: If the headers were enlisted sooner, passing csp would do. */
1929    set_client_address(csp, headers);
1930    get_tag_list_for_client(csp->client_tags, csp->client_address);
1931 #endif
1932
1933    /*
1934     * Determine the actions for this URL
1935     */
1936 #ifdef FEATURE_TOGGLE
1937    if (!(csp->flags & CSP_FLAG_TOGGLED_ON))
1938    {
1939       /* Most compatible set of actions (i.e. none) */
1940       init_current_action(csp->action);
1941    }
1942    else
1943 #endif /* ndef FEATURE_TOGGLE */
1944    {
1945       get_url_actions(csp, http);
1946    }
1947
1948    enlist(csp->headers, http->cmd);
1949
1950    /* Append the previously read headers */
1951    err = list_append_list_unique(csp->headers, headers);
1952    destroy_list(headers);
1953
1954    return err;
1955
1956 }
1957
1958
1959 /*********************************************************************
1960  *
1961  * Function    : parse_client_request
1962  *
1963  * Description : Parses the client's request and decides what to do
1964  *               with it.
1965  *
1966  *               Note that since we're not using select() we could get
1967  *               blocked here if a client connected, then didn't say
1968  *               anything!
1969  *
1970  * Parameters  :
1971  *          1  :  csp = Current client state (buffers, headers, etc...)
1972  *
1973  * Returns     :  JB_ERR_OK or JB_ERR_PARSE
1974  *
1975  *********************************************************************/
1976 static jb_err parse_client_request(struct client_state *csp)
1977 {
1978    struct http_request *http = csp->http;
1979    jb_err err;
1980
1981 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
1982    if ((csp->config->feature_flags & RUNTIME_FEATURE_CONNECTION_KEEP_ALIVE)
1983     && (!strcmpic(csp->http->version, "HTTP/1.1"))
1984     && (csp->http->ssl == 0))
1985    {
1986       /* Assume persistence until further notice */
1987       csp->flags |= CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
1988    }
1989 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
1990
1991    if (csp->http->ssl == 0)
1992    {
1993       /*
1994        * This whole block belongs to chat() but currently
1995        * has to be executed before sed().
1996        */
1997       if (csp->flags & CSP_FLAG_CHUNKED_CLIENT_BODY)
1998       {
1999          if (receive_chunked_client_request_body(csp) != JB_ERR_OK)
2000          {
2001             return JB_ERR_PARSE;
2002          }
2003       }
2004       else
2005       {
2006          csp->expected_client_content_length = get_expected_content_length(csp->headers);
2007       }
2008       verify_request_length(csp);
2009    }
2010 #ifndef FEATURE_HTTPS_INSPECTION
2011    else
2012    {
2013       csp->flags |= CSP_FLAG_SERVER_SOCKET_TAINTED;
2014    }
2015 #endif
2016
2017    err = sed(csp, FILTER_CLIENT_HEADERS);
2018    if (JB_ERR_OK != err)
2019    {
2020       log_error(LOG_LEVEL_ERROR, "Failed to parse client request from %s.",
2021          csp->ip_addr_str);
2022       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 400 0",
2023          csp->ip_addr_str, csp->http->cmd);
2024       write_socket_delayed(csp->cfd, CHEADER, strlen(CHEADER), get_write_delay(csp));
2025       return JB_ERR_PARSE;
2026    }
2027    csp->flags |= CSP_FLAG_CLIENT_HEADER_PARSING_DONE;
2028
2029    /* Check request line for rewrites. */
2030    if ((NULL == csp->headers->first->str)
2031       || (strcmp(http->cmd, csp->headers->first->str) &&
2032          (JB_ERR_OK != change_request_destination(csp))))
2033    {
2034       /*
2035        * A header filter broke the request line - bail out.
2036        */
2037       write_socket_delayed(csp->cfd, MESSED_UP_REQUEST_RESPONSE,
2038          strlen(MESSED_UP_REQUEST_RESPONSE), get_write_delay(csp));
2039       /* XXX: Use correct size */
2040       log_error(LOG_LEVEL_CLF,
2041          "%s - - [%T] \"Invalid request generated\" 400 0", csp->ip_addr_str);
2042       log_error(LOG_LEVEL_ERROR,
2043          "Invalid request line after applying header filters.");
2044       free_http_request(http);
2045
2046       return JB_ERR_PARSE;
2047    }
2048
2049    if (client_has_unsupported_expectations(csp))
2050    {
2051       return JB_ERR_PARSE;
2052    }
2053
2054    return JB_ERR_OK;
2055
2056 }
2057
2058
2059 /*********************************************************************
2060  *
2061  * Function    : read_http_request_body
2062  *
2063  * Description : Reads remaining request body from the client.
2064  *
2065  * Parameters  :
2066  *          1  :  csp = Current client state (buffers, headers, etc...)
2067  *
2068  * Returns     :  0 on success, anything else is an error.
2069  *
2070  *********************************************************************/
2071 static int read_http_request_body(struct client_state *csp)
2072 {
2073    size_t to_read = csp->expected_client_content_length;
2074    int len;
2075
2076    assert(to_read != 0);
2077
2078    /* check if all data has been already read */
2079    if (to_read <= (csp->client_iob->eod - csp->client_iob->cur))
2080    {
2081       return 0;
2082    }
2083
2084    for (to_read -= (size_t)(csp->client_iob->eod - csp->client_iob->cur);
2085         to_read > 0 && data_is_available(csp->cfd, csp->config->socket_timeout);
2086         to_read -= (unsigned)len)
2087    {
2088       char buf[BUFFER_SIZE];
2089       size_t max_bytes_to_read = to_read < sizeof(buf) ? to_read : sizeof(buf);
2090
2091       log_error(LOG_LEVEL_CONNECT,
2092          "Waiting for up to %lu bytes of request body from the client.",
2093          max_bytes_to_read);
2094       len = read_socket(csp->cfd, buf, (int)max_bytes_to_read);
2095       if (len <= -1)
2096       {
2097          log_error(LOG_LEVEL_CONNECT, "Failed receiving request body from %s: %E", csp->ip_addr_str);
2098          return 1;
2099       }
2100       if (add_to_iob(csp->client_iob, csp->config->buffer_limit, (char *)buf, len))
2101       {
2102          return 1;
2103       }
2104       assert(to_read >= len);
2105    }
2106
2107    if (to_read != 0)
2108    {
2109       log_error(LOG_LEVEL_CONNECT,
2110          "Not enough request body has been read: expected %lu more bytes",
2111          to_read);
2112       return 1;
2113    }
2114    log_error(LOG_LEVEL_CONNECT,
2115       "The last %d bytes of the request body have been read", len);
2116    return 0;
2117 }
2118
2119
2120 /*********************************************************************
2121  *
2122  * Function    : update_client_headers
2123  *
2124  * Description : Updates the HTTP headers from the client request.
2125  *
2126  * Parameters  :
2127  *          1  :  csp = Current client state (buffers, headers, etc...)
2128  *          2  :  new_content_length = new content length value to set
2129  *
2130  * Returns     :  0 on success, anything else is an error.
2131  *
2132  *********************************************************************/
2133 static int update_client_headers(struct client_state *csp, size_t new_content_length)
2134 {
2135    static const char content_length[] = "Content-Length:";
2136    int updated = 0;
2137    struct list_entry *p;
2138
2139 #ifndef FEATURE_HTTPS_INSPECTION
2140    for (p = csp->headers->first;
2141 #else
2142    for (p = csp->http->client_ssl ? csp->https_headers->first : csp->headers->first;
2143 #endif
2144         !updated  && (p != NULL); p = p->next)
2145    {
2146       /* Header crunch()ed in previous run? -> ignore */
2147       if (p->str == NULL)
2148       {
2149          continue;
2150       }
2151
2152       /* Does the current parser handle this header? */
2153       if (0 == strncmpic(p->str, content_length, sizeof(content_length) - 1))
2154       {
2155          updated = (JB_ERR_OK == header_adjust_content_length((char **)&(p->str), new_content_length));
2156          if (!updated)
2157          {
2158             return 1;
2159          }
2160       }
2161    }
2162
2163    return !updated;
2164 }
2165
2166
2167 /*********************************************************************
2168  *
2169  * Function    : can_filter_request_body
2170  *
2171  * Description : Checks if the current request body can be stored in
2172  *               the client_iob without hitting buffer limit.
2173  *
2174  * Parameters  :
2175  *          1  : csp = Current client state (buffers, headers, etc...)
2176  *
2177  * Returns     : TRUE if the current request size do not exceed buffer limit
2178  *               FALSE otherwise.
2179  *
2180  *********************************************************************/
2181 static int can_filter_request_body(const struct client_state *csp)
2182 {
2183    if (!can_add_to_iob(csp->client_iob, csp->config->buffer_limit,
2184                        csp->expected_client_content_length))
2185    {
2186       log_error(LOG_LEVEL_INFO,
2187          "Not filtering request body from %s: buffer limit %lu will be exceeded "
2188          "(content length %llu)", csp->ip_addr_str, csp->config->buffer_limit,
2189          csp->expected_client_content_length);
2190       return FALSE;
2191    }
2192    return TRUE;
2193 }
2194
2195
2196 /*********************************************************************
2197  *
2198  * Function    : send_http_request
2199  *
2200  * Description : Sends the HTTP headers from the client request
2201  *               and all the body data that has already been received.
2202  *
2203  * Parameters  :
2204  *          1  :  csp = Current client state (buffers, headers, etc...)
2205  *
2206  * Returns     :  0 on success, anything else is an error.
2207  *
2208  *********************************************************************/
2209 static int send_http_request(struct client_state *csp)
2210 {
2211    char *hdr;
2212    int write_failure;
2213    const char *to_send;
2214    size_t to_send_len;
2215    int filter_client_body = csp->expected_client_content_length != 0 &&
2216       client_body_filters_enabled(csp->action) && can_filter_request_body(csp);
2217
2218    if (filter_client_body)
2219    {
2220       if (read_http_request_body(csp))
2221       {
2222          return 1;
2223       }
2224       to_send_len = csp->expected_client_content_length;
2225       to_send = execute_client_body_filters(csp, &to_send_len);
2226       if (to_send == NULL)
2227       {
2228          /* just flush client_iob */
2229          filter_client_body = FALSE;
2230       }
2231       else if (to_send_len != csp->expected_client_content_length &&
2232          update_client_headers(csp, to_send_len))
2233       {
2234          log_error(LOG_LEVEL_HEADER, "Error updating client headers");
2235          freez(to_send);
2236          return 1;
2237       }
2238       csp->expected_client_content_length = 0;
2239    }
2240
2241    hdr = list_to_text(csp->headers);
2242    if (hdr == NULL)
2243    {
2244       /* FIXME Should handle error properly */
2245       log_error(LOG_LEVEL_FATAL, "Out of memory parsing client header");
2246    }
2247    list_remove_all(csp->headers);
2248
2249    /*
2250     * Write the client's (modified) header to the server
2251     * (along with anything else that may be in the buffer)
2252     */
2253    write_failure = 0 != write_socket(csp->server_connection.sfd, hdr, strlen(hdr));
2254    freez(hdr);
2255
2256    if (write_failure)
2257    {
2258       log_error(LOG_LEVEL_CONNECT, "Failed sending request headers to: %s: %E",
2259          csp->http->hostport);
2260       if (filter_client_body)
2261       {
2262          freez(to_send);
2263       }
2264       return 1;
2265    }
2266
2267    if (filter_client_body)
2268    {
2269       write_failure = 0 != write_socket(csp->server_connection.sfd, to_send, to_send_len);
2270       freez(to_send);
2271       if (write_failure)
2272       {
2273          log_error(LOG_LEVEL_CONNECT, "Failed sending filtered request body to: %s: %E",
2274             csp->http->hostport);
2275          return 1;
2276       }
2277    }
2278
2279    if (((csp->flags & CSP_FLAG_PIPELINED_REQUEST_WAITING) == 0)
2280       && (flush_iob(csp->server_connection.sfd, csp->client_iob, 0) < 0))
2281    {
2282       log_error(LOG_LEVEL_CONNECT, "Failed sending request body to: %s: %E",
2283          csp->http->hostport);
2284       return 1;
2285    }
2286    return 0;
2287 }
2288
2289
2290 #ifdef FEATURE_HTTPS_INSPECTION
2291 /*********************************************************************
2292  *
2293  * Function    : read_https_request_body
2294  *
2295  * Description : Reads remaining request body from the client.
2296  *
2297  * Parameters  :
2298  *          1  :  csp = Current client state (buffers, headers, etc...)
2299  *
2300  * Returns     :  0 on success, anything else is an error.
2301  *
2302  *********************************************************************/
2303 static int read_https_request_body(struct client_state *csp)
2304 {
2305    size_t to_read = csp->expected_client_content_length;
2306    int len;
2307
2308    assert(to_read != 0);
2309
2310    /* check if all data has been already read */
2311    if (to_read <= (csp->client_iob->eod - csp->client_iob->cur))
2312    {
2313       return 0;
2314    }
2315
2316    for (to_read -= (size_t)(csp->client_iob->eod - csp->client_iob->cur);
2317         to_read > 0 && (is_ssl_pending(&(csp->ssl_client_attr)) ||
2318           data_is_available(csp->cfd, csp->config->socket_timeout));
2319         to_read -= (unsigned)len)
2320    {
2321       unsigned char buf[BUFFER_SIZE];
2322       size_t max_bytes_to_read = to_read < sizeof(buf) ? to_read : sizeof(buf);
2323
2324       log_error(LOG_LEVEL_CONNECT,
2325          "Waiting for up to %lu bytes of request body from the client.",
2326          max_bytes_to_read);
2327       len = ssl_recv_data(&(csp->ssl_client_attr), buf,
2328          (unsigned)max_bytes_to_read);
2329       if (len <= 0)
2330       {
2331          log_error(LOG_LEVEL_CONNECT, "Failed receiving request body from %s", csp->ip_addr_str);
2332          return 1;
2333       }
2334       if (add_to_iob(csp->client_iob, csp->config->buffer_limit, (char *)buf, len))
2335       {
2336          return 1;
2337       }
2338       assert(to_read >= len);
2339    }
2340
2341    if (to_read != 0)
2342    {
2343       log_error(LOG_LEVEL_CONNECT,
2344          "Not enough request body has been read: expected %lu more bytes",
2345          to_read);
2346       return 1;
2347    }
2348
2349    log_error(LOG_LEVEL_CONNECT,
2350       "The last %llu bytes of the request body have been read",
2351       csp->expected_client_content_length);
2352    return 0;
2353 }
2354
2355
2356 /*********************************************************************
2357  *
2358  * Function    : receive_and_send_encrypted_post_data
2359  *
2360  * Description : Reads remaining request body from the client and sends
2361  *               it to the server.
2362  *
2363  * Parameters  :
2364  *          1  :  csp = Current client state (buffers, headers, etc...)
2365  *
2366  * Returns     :  0 on success, anything else is an error.
2367  *
2368  *********************************************************************/
2369 static int receive_and_send_encrypted_post_data(struct client_state *csp)
2370 {
2371    int content_length_known = csp->expected_client_content_length != 0;
2372
2373    while (is_ssl_pending(&(csp->ssl_client_attr))
2374       || (content_length_known && csp->expected_client_content_length != 0))
2375    {
2376       unsigned char buf[BUFFER_SIZE];
2377       int len;
2378       int max_bytes_to_read = sizeof(buf);
2379
2380       if (content_length_known && csp->expected_client_content_length < sizeof(buf))
2381       {
2382          max_bytes_to_read = (int)csp->expected_client_content_length;
2383       }
2384       log_error(LOG_LEVEL_CONNECT,
2385          "Waiting for up to %d bytes of request body from the client.",
2386          max_bytes_to_read);
2387       len = ssl_recv_data(&(csp->ssl_client_attr), buf,
2388          (unsigned)max_bytes_to_read);
2389       if (len == -1)
2390       {
2391          return 1;
2392       }
2393       if (len == 0)
2394       {
2395          /* XXX: Does this actually happen? */
2396          break;
2397       }
2398       log_error(LOG_LEVEL_CONNECT, "Forwarding %d bytes of encrypted request body",
2399          len);
2400       len = ssl_send_data(&(csp->ssl_server_attr), buf, (size_t)len);
2401       if (len == -1)
2402       {
2403          return 1;
2404       }
2405       if (csp->expected_client_content_length != 0)
2406       {
2407          if (csp->expected_client_content_length >= len)
2408          {
2409             csp->expected_client_content_length -= (unsigned)len;
2410          }
2411          if (csp->expected_client_content_length == 0)
2412          {
2413             log_error(LOG_LEVEL_CONNECT, "Forwarded the last %d bytes", len);
2414             break;
2415          }
2416       }
2417    }
2418
2419    log_error(LOG_LEVEL_CONNECT, "Done forwarding encrypted request body");
2420
2421    return 0;
2422
2423 }
2424
2425
2426 /*********************************************************************
2427  *
2428  * Function    : send_https_request
2429  *
2430  * Description : Sends the HTTP headers from the client request
2431  *               and all the body data that has already been received.
2432  *
2433  * Parameters  :
2434  *          1  :  csp = Current client state (buffers, headers, etc...)
2435  *
2436  * Returns     :  0 on success, anything else is an error.
2437  *
2438  *********************************************************************/
2439 static int send_https_request(struct client_state *csp)
2440 {
2441    char *hdr;
2442    int ret;
2443    long flushed = 0;
2444    const char *to_send;
2445    size_t to_send_len;
2446    int filter_client_body = csp->expected_client_content_length != 0 &&
2447       client_body_filters_enabled(csp->action) && can_filter_request_body(csp);
2448
2449    if (filter_client_body)
2450    {
2451       if (read_https_request_body(csp))
2452       {
2453          return 1;
2454       }
2455       to_send_len = csp->expected_client_content_length;
2456       to_send = execute_client_body_filters(csp, &to_send_len);
2457       if (to_send == NULL)
2458       {
2459          /* just flush client_iob */
2460          filter_client_body = FALSE;
2461       }
2462       else if (to_send_len != csp->expected_client_content_length &&
2463          update_client_headers(csp, to_send_len))
2464       {
2465          log_error(LOG_LEVEL_HEADER, "Error updating client headers");
2466          return 1;
2467       }
2468       csp->expected_client_content_length = 0;
2469    }
2470
2471    hdr = list_to_text(csp->https_headers);
2472    if (hdr == NULL)
2473    {
2474       /* FIXME Should handle error properly */
2475       log_error(LOG_LEVEL_FATAL, "Out of memory parsing client header");
2476    }
2477    list_remove_all(csp->https_headers);
2478
2479    /*
2480     * Write the client's (modified) header to the server
2481     * (along with anything else that may be in the buffer)
2482     */
2483    ret = ssl_send_data(&(csp->ssl_server_attr),
2484       (const unsigned char *)hdr, strlen(hdr));
2485    freez(hdr);
2486
2487    if (ret < 0)
2488    {
2489       log_error(LOG_LEVEL_CONNECT,
2490          "Failed sending encrypted request headers to: %s: %E",
2491          csp->http->hostport);
2492       mark_server_socket_tainted(csp);
2493       return 1;
2494    }
2495
2496    if (filter_client_body)
2497    {
2498       ret = ssl_send_data(&(csp->ssl_server_attr), (const unsigned char *)to_send, to_send_len);
2499       freez(to_send);
2500       if (ret < 0)
2501       {
2502          log_error(LOG_LEVEL_CONNECT, "Failed sending filtered request body to: %s",
2503             csp->http->hostport);
2504          return 1;
2505       }
2506    }
2507
2508    if (((csp->flags & CSP_FLAG_PIPELINED_REQUEST_WAITING) == 0)
2509       && ((flushed = ssl_flush_socket(&(csp->ssl_server_attr),
2510             csp->client_iob)) < 0))
2511    {
2512       log_error(LOG_LEVEL_CONNECT, "Failed sending request body to: %s: %E",
2513          csp->http->hostport);
2514       return 1;
2515    }
2516    if (flushed != 0 || csp->expected_client_content_length != 0)
2517    {
2518       if (csp->expected_client_content_length != 0)
2519       {
2520          if (csp->expected_client_content_length < flushed)
2521          {
2522             log_error(LOG_LEVEL_ERROR,
2523                "Flushed %ld bytes of request body while only expecting %llu",
2524                flushed, csp->expected_client_content_length);
2525             csp->expected_client_content_length = 0;
2526          }
2527          else
2528          {
2529             log_error(LOG_LEVEL_CONNECT,
2530                "Flushed %ld bytes of request body while expecting %llu",
2531                flushed, csp->expected_client_content_length);
2532             csp->expected_client_content_length -= (unsigned)flushed;
2533             if (receive_and_send_encrypted_post_data(csp))
2534             {
2535                return 1;
2536             }
2537          }
2538       }
2539       else
2540       {
2541          log_error(LOG_LEVEL_CONNECT,
2542             "Flushed %ld bytes of request body", flushed);
2543       }
2544    }
2545
2546    log_error(LOG_LEVEL_CONNECT, "Encrypted request sent");
2547
2548    return 0;
2549
2550 }
2551
2552
2553 /*********************************************************************
2554  *
2555  * Function    :  receive_encrypted_request_headers
2556  *
2557  * Description :  Receives the encrypted request headers when
2558  *                https-inspecting.
2559  *
2560  * Parameters  :
2561  *          1  :  csp = Current client state (buffers, headers, etc...)
2562  *
2563  * Returns     :  JB_ERR_OK on success,
2564  *                JB_ERR_PARSE or JB_ERR_MEMORY otherwise
2565  *
2566  *********************************************************************/
2567 static jb_err receive_encrypted_request_headers(struct client_state *csp)
2568 {
2569    char buf[BUFFER_SIZE];
2570    int len;
2571    char *p;
2572
2573    do
2574    {
2575       log_error(LOG_LEVEL_HEADER, "Waiting for encrypted client headers");
2576       if (!is_ssl_pending(&(csp->ssl_client_attr)) &&
2577           !data_is_available(csp->cfd, csp->config->socket_timeout))
2578       {
2579          log_error(LOG_LEVEL_CONNECT,
2580             "Socket %d timed out while waiting for client headers", csp->cfd);
2581          return JB_ERR_PARSE;
2582       }
2583       len = ssl_recv_data(&(csp->ssl_client_attr),
2584          (unsigned char *)buf, sizeof(buf));
2585       if (len == 0)
2586       {
2587          log_error(LOG_LEVEL_CONNECT,
2588             "Socket %d closed while waiting for client headers", csp->cfd);
2589          return JB_ERR_PARSE;
2590       }
2591       if (len == -1)
2592       {
2593          return JB_ERR_PARSE;
2594       }
2595       if (add_to_iob(csp->client_iob, csp->config->buffer_limit, buf, len))
2596       {
2597          return JB_ERR_MEMORY;
2598       }
2599       p = strstr(csp->client_iob->cur, "\r\n\r\n");
2600    } while (p == NULL);
2601
2602    log_error(LOG_LEVEL_HEADER, "Encrypted headers received completely");
2603
2604    return JB_ERR_OK;
2605 }
2606
2607
2608 /*********************************************************************
2609  *
2610  * Function    :  change_encrypted_request_destination
2611  *
2612  * Description :  Parse a (rewritten) request line from an encrypted
2613  *                request and regenerate the http request data.
2614  *
2615  * Parameters  :
2616  *          1  :  csp = Current client state (buffers, headers, etc...)
2617  *
2618  * Returns     :  Forwards the parse_http_request() return code.
2619  *                Terminates in case of memory problems.
2620  *
2621  *********************************************************************/
2622 static jb_err change_encrypted_request_destination(struct client_state *csp)
2623 {
2624    jb_err err;
2625    char *original_host = csp->http->host;
2626    int original_port = csp->http->port;
2627
2628    log_error(LOG_LEVEL_REDIRECTS, "Rewrite detected: %s",
2629       csp->https_headers->first->str);
2630    csp->http->host = NULL;
2631    free_http_request(csp->http);
2632    err = parse_http_request(csp->https_headers->first->str, csp->http);
2633    if (JB_ERR_OK != err)
2634    {
2635       log_error(LOG_LEVEL_ERROR, "Couldn't parse rewritten request: %s.",
2636          jb_err_to_string(err));
2637       freez(original_host);
2638       return err;
2639    }
2640
2641    if (csp->http->host == NULL)
2642    {
2643       char port_string[10];
2644       /*
2645        * The rewritten request line did not specify a host
2646        * which means we can use the original host specified
2647        * by the client.
2648        */
2649       csp->http->host = original_host;
2650       csp->http->port = original_port;
2651       log_error(LOG_LEVEL_REDIRECTS, "Keeping the original host: %s",
2652          csp->http->host);
2653       /*
2654        * If the rewritten request line didn't contain a host
2655        * it also didn't contain a port so we can reuse the host
2656        * port.
2657        */
2658       freez(csp->http->hostport);
2659       csp->http->hostport = strdup_or_die(csp->http->host);
2660       snprintf(port_string, sizeof(port_string), ":%d", original_port);
2661       err = string_append(&csp->http->hostport, port_string);
2662       if (err != JB_ERR_OK)
2663       {
2664          log_error(LOG_LEVEL_ERROR, "Failed to rebuild hostport: %s.",
2665             jb_err_to_string(err));
2666          return err;
2667       }
2668
2669       /*
2670        * While the request line didn't mention it,
2671        * we're https-inspecting and want to speak TLS
2672        * with the server.
2673        */
2674       csp->http->server_ssl = 1;
2675       csp->http->ssl = 1;
2676    }
2677    else
2678    {
2679       /* The rewrite filter added a host so we can ditch the original */
2680       freez(original_host);
2681       csp->http->server_ssl = csp->http->ssl;
2682    }
2683
2684    csp->http->client_ssl = 1;
2685
2686    freez(csp->https_headers->first->str);
2687    build_request_line(csp, NULL, &csp->https_headers->first->str);
2688
2689    if (!server_use_ssl(csp))
2690    {
2691       log_error(LOG_LEVEL_REDIRECTS,
2692          "Rewritten request line results in downgrade to http");
2693       /*
2694        * Replace the unencryptd headers received with the
2695        * CONNECT request with the ones we received securely.
2696        */
2697       destroy_list(csp->headers);
2698       csp->headers->first = csp->https_headers->first;
2699       csp->headers->last  = csp->https_headers->last;
2700       csp->https_headers->first = NULL;
2701       csp->https_headers->last = NULL;
2702    }
2703
2704    return JB_ERR_OK;
2705
2706 }
2707
2708
2709 /*********************************************************************
2710  *
2711  * Function    :  process_encrypted_request_headers
2712  *
2713  * Description :  Receives and parses the encrypted headers send
2714  *                by the client when https-inspecting.
2715  *
2716  * Parameters  :
2717  *          1  :  csp = Current client state (buffers, headers, etc...)
2718  *
2719  * Returns     :  JB_ERR_OK on success,
2720  *                JB_ERR_PARSE or JB_ERR_MEMORY otherwise
2721  *
2722  *********************************************************************/
2723 static jb_err process_encrypted_request_headers(struct client_state *csp)
2724 {
2725    char *p;
2726    char *request_line;
2727    jb_err err;
2728    /* Temporary copy of the client's headers before they get enlisted in csp->https_headers */
2729    struct list header_list;
2730    struct list *headers = &header_list;
2731
2732    assert(csp->ssl_with_client_is_opened);
2733
2734 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2735    if (csp->config->feature_flags & RUNTIME_FEATURE_CONNECTION_KEEP_ALIVE)
2736    {
2737       csp->flags |= CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
2738    }
2739 #endif
2740    err = receive_encrypted_request_headers(csp);
2741    if (err != JB_ERR_OK)
2742    {
2743       if (csp->client_iob->cur == NULL ||
2744           csp->client_iob->cur == csp->client_iob->eod)
2745       {
2746          /*
2747           * We did not receive any data, most likely because the
2748           * client is done. Don't log this as a parse failure.
2749           */
2750          return JB_ERR_PARSE;
2751       }
2752       /* XXX: Also used for JB_ERR_MEMORY */
2753       log_error(LOG_LEVEL_ERROR, "Failed to receive encrypted request: %s",
2754          jb_err_to_string(err));
2755       ssl_send_data_delayed(&(csp->ssl_client_attr),
2756          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2757       return err;
2758    }
2759
2760    /* We don't need get_request_line() because the whole HTTP head is buffered. */
2761    request_line = get_header(csp->client_iob);
2762    if (request_line == NULL)
2763    {
2764       log_error(LOG_LEVEL_ERROR, "Failed to get the encrypted request line");
2765       ssl_send_data_delayed(&(csp->ssl_client_attr),
2766          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2767       return JB_ERR_PARSE;
2768    }
2769    assert(*request_line != '\0');
2770
2771    if (client_protocol_is_unsupported(csp, request_line))
2772    {
2773       /*
2774        * If the protocol is unsupported we're done here.
2775        * client_protocol_is_unsupported() took care of sending
2776        * the error response and logging the error message.
2777        */
2778       return JB_ERR_PARSE;
2779    }
2780
2781 #ifdef FEATURE_FORCE_LOAD
2782    if (force_required(csp, request_line))
2783    {
2784       csp->flags |= CSP_FLAG_FORCED;
2785    }
2786 #endif /* def FEATURE_FORCE_LOAD */
2787
2788    free_http_request(csp->http);
2789
2790    err = parse_http_request(request_line, csp->http);
2791    /* XXX: Restore ssl setting. This is ugly */
2792    csp->http->client_ssl = 1;
2793    csp->http->server_ssl = 1;
2794
2795    freez(request_line);
2796    if (JB_ERR_OK != err)
2797    {
2798       ssl_send_data_delayed(&(csp->ssl_client_attr),
2799          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2800       /* XXX: Use correct size */
2801       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"Invalid request\" 400 0", csp->ip_addr_str);
2802       log_error(LOG_LEVEL_ERROR,
2803          "Couldn't parse request line received from %s: %s",
2804          csp->ip_addr_str, jb_err_to_string(err));
2805
2806       free_http_request(csp->http);
2807       return JB_ERR_PARSE;
2808    }
2809
2810    /* Parse the rest of the client's headers. */
2811    init_list(headers);
2812    for (;;)
2813    {
2814       p = get_header(csp->client_iob);
2815
2816       if (p == NULL)
2817       {
2818          /* There are no additional headers to read. */
2819          break;
2820       }
2821       enlist(headers, p);
2822       freez(p);
2823    }
2824
2825    if (JB_ERR_OK != get_destination_from_https_headers(headers, csp->http))
2826    {
2827       /*
2828        * Our attempts to get the request destination
2829        * elsewhere failed.
2830        */
2831       log_error(LOG_LEVEL_ERROR,
2832          "Failed to get the encrypted request destination");
2833       ssl_send_data_delayed(&(csp->ssl_client_attr),
2834          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2835       destroy_list(headers);
2836
2837       return JB_ERR_PARSE;
2838    }
2839
2840    /* Split the domain we just got for pattern matching */
2841    init_domain_components(csp->http);
2842
2843 #ifdef FEATURE_CLIENT_TAGS
2844    /* XXX: If the headers were enlisted sooner, passing csp would do. */
2845    if (csp->client_address == NULL)
2846    {
2847       set_client_address(csp, headers);
2848       get_tag_list_for_client(csp->client_tags, csp->client_address);
2849    }
2850 #endif
2851
2852 #ifdef FEATURE_TOGGLE
2853    if ((csp->flags & CSP_FLAG_TOGGLED_ON) != 0)
2854 #endif
2855    {
2856       /*
2857        * Determine the actions for this request after
2858        * clearing the ones from the previous one.
2859        */
2860       free_current_action(csp->action);
2861       get_url_actions(csp, csp->http);
2862    }
2863
2864    enlist(csp->https_headers, csp->http->cmd);
2865
2866    /* Append the previously read headers */
2867    err = list_append_list_unique(csp->https_headers, headers);
2868    destroy_list(headers);
2869    if (JB_ERR_OK != err)
2870    {
2871       /* XXX: Send error message */
2872       return err;
2873    }
2874
2875    /* XXX: Work around crash */
2876    csp->error_message = NULL;
2877
2878    /* XXX: Why do this here? */
2879    csp->http->ssl = 1;
2880
2881    err = sed_https(csp);
2882    if (JB_ERR_OK != err)
2883    {
2884       ssl_send_data_delayed(&(csp->ssl_client_attr),
2885          (const unsigned char *)CHEADER, strlen(CHEADER), get_write_delay(csp));
2886       log_error(LOG_LEVEL_ERROR, "Failed to parse client request from %s.",
2887          csp->ip_addr_str);
2888       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 400 0",
2889          csp->ip_addr_str, csp->http->cmd);
2890       return JB_ERR_PARSE;
2891    }
2892
2893    if ((NULL == csp->https_headers->first->str)
2894       || (strcmp(csp->http->cmd, csp->https_headers->first->str) &&
2895          (JB_ERR_OK != change_encrypted_request_destination(csp))))
2896    {
2897       ssl_send_data_delayed(&(csp->ssl_client_attr),
2898          (const unsigned char *)MESSED_UP_REQUEST_RESPONSE,
2899          strlen(MESSED_UP_REQUEST_RESPONSE), get_write_delay(csp));
2900       log_error(LOG_LEVEL_ERROR,
2901          "Invalid request line after applying header filters.");
2902       /* XXX: Use correct size */
2903       log_error(LOG_LEVEL_CLF,
2904          "%s - - [%T] \"Invalid request generated\" 400 0", csp->ip_addr_str);
2905
2906       return JB_ERR_PARSE;
2907    }
2908
2909    log_error(LOG_LEVEL_HEADER, "Encrypted request headers processed");
2910    log_error(LOG_LEVEL_REQUEST, "https://%s%s", csp->http->hostport,
2911       csp->http->path);
2912
2913    return err;
2914
2915 }
2916
2917 /*********************************************************************
2918  *
2919  * Function    :  cgi_page_requested
2920  *
2921  * Description :  Checks if a request is for an internal CGI page.
2922  *
2923  * Parameters  :
2924  *          1  :  host = The host requested by the client.
2925  *
2926  * Returns     :  1 if a CGI page has been requested, 0 otherwise
2927  *
2928  *********************************************************************/
2929 static int cgi_page_requested(const char *host)
2930 {
2931    if ((0 == strcmpic(host, CGI_SITE_1_HOST))
2932     || (0 == strcmpic(host, CGI_SITE_1_HOST "."))
2933     || (0 == strcmpic(host, CGI_SITE_2_HOST))
2934     || (0 == strcmpic(host, CGI_SITE_2_HOST ".")))
2935    {
2936       return 1;
2937    }
2938
2939    return 0;
2940
2941 }
2942
2943
2944 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
2945 /*********************************************************************
2946  *
2947  * Function    :  continue_https_chat
2948  *
2949  * Description :  Behaves similar to chat() but only deals with
2950  *                https-inspected requests that arrive on an already
2951  *                established connection. The first request is always
2952  *                served by chat() which is a lot more complex as it
2953  *                has to deal with forwarding settings and connection
2954  *                failures etc.
2955  *
2956  *                If a connection to the server has already been
2957  *                opened it is reused unless the request is blocked
2958  *                or the forwarder changed.
2959  *
2960  *                If a connection to the server has not yet been
2961  *                opened (because the previous request was crunched),
2962  *                or the forwarder changed, the connection is dropped
2963  *                so that the client retries on a fresh one.
2964  *
2965  * Parameters  :
2966  *          1  :  csp = Current client state (buffers, headers, etc...)
2967  *
2968  * Returns     :  Nothing.
2969  *
2970  *********************************************************************/
2971 static void continue_https_chat(struct client_state *csp)
2972 {
2973    const struct forward_spec *fwd;
2974
2975    if (JB_ERR_OK != process_encrypted_request_headers(csp))
2976    {
2977       csp->flags &= ~CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
2978       return;
2979    }
2980
2981 #if defined(FEATURE_STATISTICS) && defined(MUTEX_LOCKS_AVAILABLE)
2982    privoxy_mutex_lock(&block_statistics_mutex);
2983    number_of_requests_received++;
2984    privoxy_mutex_unlock(&block_statistics_mutex);
2985 #endif
2986
2987    csp->requests_received_total++;
2988
2989    /*
2990     * We have an encrypted request. Check if one of the crunchers wants it.
2991     */
2992    if (crunch_response_triggered(csp, crunchers_all))
2993    {
2994       /*
2995        * Yes. The client got the crunch response and we're done here.
2996        */
2997       return;
2998    }
2999    if (csp->ssl_with_server_is_opened == 0)
3000    {
3001       log_error(LOG_LEVEL_CONNECT,
3002          "Dropping the client connection on socket %d. "
3003          "The server connection has not been established yet.",
3004          csp->cfd);
3005       csp->flags &= ~CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
3006       return;
3007    }
3008    assert(csp->server_connection.sfd != JB_INVALID_SOCKET);
3009
3010    fwd = forward_url(csp, csp->http);
3011    if (!connection_destination_matches(&csp->server_connection, csp->http, fwd))
3012    {
3013       log_error(LOG_LEVEL_CONNECT,
3014          "Dropping the client connection on socket %d with "
3015          "server socket %d connected to %s. The forwarder has changed.",
3016          csp->cfd, csp->server_connection.sfd, csp->server_connection.host);
3017       csp->flags &= ~CSP_FLAG_CLIENT_CONNECTION_KEEP_ALIVE;
3018       return;
3019    }
3020
3021    log_applied_actions(csp->action);
3022
3023    log_error(LOG_LEVEL_CONNECT,
3024       "Reusing server socket %d connected to %s. Requests already sent: %u.",
3025       csp->server_connection.sfd, csp->server_connection.host,
3026       csp->server_connection.requests_sent_total);
3027
3028    if (send_https_request(csp))
3029    {
3030       /*
3031        * Most likely the server connection timed out. We can't easily
3032        * create a new one so simply drop the client connection without a
3033        * error response to let the client retry.
3034        */
3035       log_error(LOG_LEVEL_CONNECT,
3036          "Dropping client connection on socket %d. "
3037          "Forwarding the encrypted client request failed.",
3038          csp->cfd);
3039       return;
3040    }
3041    csp->server_connection.request_sent = time(NULL);
3042    csp->server_connection.requests_sent_total++;
3043    handle_established_connection(csp);
3044    freez(csp->receive_buffer);
3045 }
3046 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
3047 #endif
3048
3049
3050 /*********************************************************************
3051  *
3052  * Function    :  handle_established_connection
3053  *
3054  * Description :  Shuffle data between client and server once the
3055  *                connection has been established and the request
3056  *                has been sent.
3057  *
3058  * Parameters  :
3059  *          1  :  csp = Current client state (buffers, headers, etc...)
3060  *
3061  * Returns     :  Nothing.
3062  *
3063  *********************************************************************/
3064 static void handle_established_connection(struct client_state *csp)
3065 {
3066    char *hdr;
3067    char *p;
3068    int n;
3069 #ifdef HAVE_POLL
3070    struct pollfd poll_fds[2];
3071 #else
3072    fd_set rfds;
3073    jb_socket maxfd;
3074    struct timeval timeout;
3075 #endif
3076    int server_body;
3077    int ms_iis5_hack = 0;
3078    unsigned long long byte_count = 0;
3079    struct http_request *http;
3080    long len = 0; /* for buffer sizes (and negative error codes) */
3081    int buffer_and_filter_content = 0;
3082    unsigned int write_delay;
3083 #ifdef FEATURE_HTTPS_INSPECTION
3084    int ret = 0;
3085    int use_ssl_tunnel = 0;
3086    csp->dont_verify_certificate = 0;
3087
3088    if (csp->http->ssl && !(csp->action->flags & ACTION_HTTPS_INSPECTION))
3089    {
3090       /* Pass encrypted content without filtering. */
3091       use_ssl_tunnel = 1;
3092    }
3093 #endif
3094
3095    /* Skeleton for HTTP response, if we should intercept the request */
3096    struct http_response *rsp;
3097 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3098    int watch_client_socket;
3099 #endif
3100
3101    csp->receive_buffer_size = csp->config->receive_buffer_size;
3102    csp->receive_buffer = zalloc(csp->receive_buffer_size + 1);
3103    if (csp->receive_buffer == NULL)
3104    {
3105       log_error(LOG_LEVEL_ERROR,
3106          "Out of memory. Failed to allocate the receive buffer.");
3107       rsp = cgi_error_memory();
3108       send_crunch_response(csp, rsp);
3109       return;
3110    }
3111
3112    http = csp->http;
3113
3114 #ifndef HAVE_POLL
3115    maxfd = (csp->cfd > csp->server_connection.sfd) ?
3116       csp->cfd : csp->server_connection.sfd;
3117 #endif
3118
3119    /* pass data between the client and server
3120     * until one or the other shuts down the connection.
3121     */
3122
3123    server_body = 0;
3124
3125 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3126    watch_client_socket = 0 == (csp->flags & CSP_FLAG_PIPELINED_REQUEST_WAITING);
3127 #endif
3128    write_delay = get_write_delay(csp);
3129
3130    for (;;)
3131    {
3132 #ifdef FEATURE_HTTPS_INSPECTION
3133       if (server_use_ssl(csp) && is_ssl_pending(&(csp->ssl_server_attr)))
3134       {
3135          /*
3136           * It's possible that the TLS library already consumed all the
3137           * data the server intends to send. If that happens poll() and
3138           * select() will no longer see the data as available so we have
3139           * to skip the calls.
3140           */
3141          goto server_wants_to_talk;
3142       }
3143       if (watch_client_socket && client_use_ssl(csp) &&
3144          is_ssl_pending(&(csp->ssl_client_attr)))
3145       {
3146          /*
3147           * The TLS libray may also consume all of the remaining data
3148           * from the client when we're shuffling the data from an
3149           * unbuffered request body to the server.
3150           */
3151          goto client_wants_to_talk;
3152       }
3153 #endif
3154 #ifndef HAVE_POLL
3155       FD_ZERO(&rfds);
3156 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3157       if (!watch_client_socket)
3158       {
3159          maxfd = csp->server_connection.sfd;
3160       }
3161       else
3162 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
3163       {
3164          FD_SET(csp->cfd, &rfds);
3165       }
3166
3167       FD_SET(csp->server_connection.sfd, &rfds);
3168 #endif /* ndef HAVE_POLL */
3169
3170 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3171       if ((csp->flags & CSP_FLAG_CHUNKED)
3172          && !(csp->flags & CSP_FLAG_CONTENT_LENGTH_SET)
3173          && ((csp->iob->eod - csp->iob->cur) >= 5)
3174          && !memcmp(csp->iob->eod-5, "0\r\n\r\n", 5))
3175       {
3176          /*
3177           * XXX: This check should be obsolete now,
3178           *      but let's wait a while to be sure.
3179           */
3180          log_error(LOG_LEVEL_CONNECT,
3181             "Looks like we got the last chunk together with "
3182             "the server headers but didn't detect it earlier. "
3183             "We better stop reading.");
3184          byte_count = (unsigned long long)(csp->iob->eod - csp->iob->cur);
3185          csp->expected_content_length = byte_count;
3186          csp->flags |= CSP_FLAG_CONTENT_LENGTH_SET;
3187       }
3188       if (server_body && server_response_is_complete(csp, byte_count))
3189       {
3190          if (csp->expected_content_length == byte_count)
3191          {
3192             log_error(LOG_LEVEL_CONNECT,
3193                "Done reading from server. Content length: %llu as expected. "
3194                "Bytes most recently read: %ld.",
3195                byte_count, len);
3196          }
3197          else
3198          {
3199             log_error(LOG_LEVEL_CONNECT,
3200                "Done reading from server. Expected content length: %llu. "
3201                "Actual content length: %llu. Bytes most recently read: %ld.",
3202                csp->expected_content_length, byte_count, len);
3203          }
3204          len = 0;
3205          /*
3206           * XXX: Should not jump around, handle_established_connection()
3207           * is complicated enough already.
3208           */
3209          goto reading_done;
3210       }
3211 #endif  /* FEATURE_CONNECTION_KEEP_ALIVE */
3212
3213 #ifdef HAVE_POLL
3214       poll_fds[0].fd = csp->cfd;
3215 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3216       if (!watch_client_socket)
3217       {
3218          /*
3219           * Ignore incoming data, but still watch out
3220           * for disconnects etc. These flags are always
3221           * implied anyway but explicitly setting them
3222           * doesn't hurt.
3223           */
3224          poll_fds[0].events = POLLERR|POLLHUP;
3225       }
3226       else
3227 #endif
3228       {
3229          poll_fds[0].events = POLLIN;
3230       }
3231       poll_fds[1].fd = csp->server_connection.sfd;
3232       poll_fds[1].events = POLLIN;
3233       n = poll(poll_fds, 2, csp->config->socket_timeout * 1000);
3234 #else
3235       timeout.tv_sec = csp->config->socket_timeout;
3236       timeout.tv_usec = 0;
3237       n = select((int)maxfd + 1, &rfds, NULL, NULL, &timeout);
3238 #endif /* def HAVE_POLL */
3239
3240       /* Server or client not responding in timeout */
3241       if (n == 0)
3242       {
3243          log_error(LOG_LEVEL_CONNECT, "Socket timeout %d reached: %s",
3244             csp->config->socket_timeout, http->url);
3245          if ((byte_count == 0) && (http->ssl == 0))
3246          {
3247             send_crunch_response(csp, error_response(csp, "connection-timeout"));
3248          }
3249          mark_server_socket_tainted(csp);
3250 #ifdef FEATURE_HTTPS_INSPECTION
3251          close_client_and_server_ssl_connections(csp);
3252 #endif
3253          return;
3254       }
3255       else if (n < 0)
3256       {
3257 #ifdef HAVE_POLL
3258          log_error(LOG_LEVEL_ERROR, "poll() failed!: %E");
3259 #else
3260          log_error(LOG_LEVEL_ERROR, "select() failed!: %E");
3261 #endif
3262          mark_server_socket_tainted(csp);
3263 #ifdef FEATURE_HTTPS_INSPECTION
3264          close_client_and_server_ssl_connections(csp);
3265 #endif
3266          return;
3267       }
3268
3269       /*
3270        * This is the body of the browser's request,
3271        * just read and write it.
3272        *
3273        * Receives data from browser and sends it to server
3274        *
3275        * XXX: Make sure the client doesn't use pipelining
3276        * behind Privoxy's back.
3277        */
3278 #ifdef HAVE_POLL
3279       if ((poll_fds[0].revents & (POLLERR|POLLHUP|POLLNVAL)) != 0)
3280       {
3281          log_error(LOG_LEVEL_CONNECT,
3282             "The client socket %d has become unusable while "
3283             "the server socket %d is still open.",
3284             csp->cfd, csp->server_connection.sfd);
3285          mark_server_socket_tainted(csp);
3286          break;
3287       }
3288
3289       if (poll_fds[0].revents != 0)
3290 #else
3291       if (FD_ISSET(csp->cfd, &rfds))
3292 #endif /* def HAVE_POLL*/
3293       {
3294          int max_bytes_to_read;
3295
3296 #ifdef FEATURE_HTTPS_INSPECTION
3297          client_wants_to_talk:
3298 #endif
3299
3300          max_bytes_to_read = (int)csp->receive_buffer_size;
3301
3302 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3303          if ((csp->flags & CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ))
3304          {
3305             if (data_is_available(csp->cfd, 0))
3306             {
3307                /*
3308                 * If the next request is already waiting, we have
3309                 * to stop select()ing the client socket. Otherwise
3310                 * we would always return right away and get nothing
3311                 * else done.
3312                 */
3313                watch_client_socket = 0;
3314                log_error(LOG_LEVEL_CONNECT,
3315                   "Stop watching client socket %d. "
3316                   "There's already another request waiting.",
3317                   csp->cfd);
3318                continue;
3319             }
3320             /*
3321              * If the client socket is set, but there's no data
3322              * available on the socket, the client went fishing
3323              * and continuing talking to the server makes no sense.
3324              */
3325             log_error(LOG_LEVEL_CONNECT,
3326                "The client closed socket %d while "
3327                "the server socket %d is still open.",
3328                csp->cfd, csp->server_connection.sfd);
3329             mark_server_socket_tainted(csp);
3330             break;
3331          }
3332          if (csp->expected_client_content_length != 0)
3333          {
3334             if (csp->expected_client_content_length < csp->receive_buffer_size)
3335             {
3336                max_bytes_to_read = (int)csp->expected_client_content_length;
3337             }
3338             log_error(LOG_LEVEL_CONNECT,
3339                "Waiting for up to %d bytes from the client.",
3340                max_bytes_to_read);
3341          }
3342          assert(max_bytes_to_read <= csp->receive_buffer_size);
3343 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
3344
3345 #ifdef FEATURE_HTTPS_INSPECTION
3346          if (client_use_ssl(csp))
3347          {
3348             if (csp->http->status == 101)
3349             {
3350                len = ssl_recv_data(&(csp->ssl_client_attr),
3351                   (unsigned char *)csp->receive_buffer,
3352                   (size_t)max_bytes_to_read);
3353                if (len == -1)
3354                {
3355                   log_error(LOG_LEVEL_ERROR, "Failed to receive data "
3356                      "on client socket %d for an upgraded connection",
3357                      csp->cfd);
3358                   break;
3359                }
3360                if (len == 0)
3361                {
3362                   log_error(LOG_LEVEL_CONNECT, "Done receiving data "
3363                      "on client socket %d for an upgraded connection",
3364                      csp->cfd);
3365                   break;
3366                }
3367                byte_count += (unsigned long long)len;
3368                len = ssl_send_data(&(csp->ssl_server_attr),
3369                   (unsigned char *)csp->receive_buffer, (size_t)len);
3370                if (len == -1)
3371                {
3372                   log_error(LOG_LEVEL_ERROR, "Failed to send data "
3373                      "on server socket %d for an upgraded connection",
3374                      csp->server_connection.sfd);
3375                   break;
3376                }
3377                continue;
3378             }
3379             log_error(LOG_LEVEL_CONNECT, "Breaking with TLS/SSL.");
3380             break;
3381          }
3382          else
3383 #endif /* def FEATURE_HTTPS_INSPECTION */
3384          {
3385             len = read_socket(csp->cfd, csp->receive_buffer, max_bytes_to_read);
3386
3387             if (len <= 0)
3388             {
3389                /* XXX: not sure if this is necessary. */
3390                mark_server_socket_tainted(csp);
3391                break; /* "game over, man" */
3392             }
3393
3394 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3395             if (csp->expected_client_content_length != 0)
3396             {
3397                assert(len <= max_bytes_to_read);
3398                csp->expected_client_content_length -= (unsigned)len;
3399                log_error(LOG_LEVEL_CONNECT,
3400                   "Expected client content length set to %llu "
3401                   "after reading %ld bytes.",
3402                   csp->expected_client_content_length, len);
3403                if (csp->expected_client_content_length == 0)
3404                {
3405                   log_error(LOG_LEVEL_CONNECT,
3406                      "Done reading from the client.");
3407                   csp->flags |= CSP_FLAG_CLIENT_REQUEST_COMPLETELY_READ;
3408                }
3409             }
3410 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
3411
3412             if (write_socket(csp->server_connection.sfd, csp->receive_buffer, (size_t)len))
3413             {
3414                log_error(LOG_LEVEL_ERROR, "write to: %s failed: %E", http->host);
3415                mark_server_socket_tainted(csp);
3416                return;
3417             }
3418          }
3419          continue;
3420       }
3421
3422       /*
3423        * The server wants to talk. It could be the header or the body.
3424        * If `hdr' is null, then it's the header otherwise it's the body.
3425        * FIXME: Does `hdr' really mean `host'? No.
3426        */
3427 #ifdef HAVE_POLL
3428       if (poll_fds[1].revents != 0)
3429 #else
3430       if (FD_ISSET(csp->server_connection.sfd, &rfds))
3431 #endif /* HAVE_POLL */
3432       {
3433 #ifdef FEATURE_HTTPS_INSPECTION
3434          server_wants_to_talk:
3435 #endif
3436 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3437          /*
3438           * If we are buffering content, we don't want to eat up to
3439           * buffer-limit bytes if the client no longer cares about them.
3440           * If we aren't buffering, however, a dead client socket will be
3441           * noticed pretty much right away anyway, so we can reduce the
3442           * overhead by skipping the check.
3443           */
3444          if (buffer_and_filter_content && !socket_is_still_alive(csp->cfd))
3445          {
3446 #ifdef _WIN32
3447             log_error(LOG_LEVEL_CONNECT,
3448                "The server still wants to talk, but the client may already have hung up on us.");
3449 #else
3450             log_error(LOG_LEVEL_CONNECT,
3451                "The server still wants to talk, but the client hung up on us.");
3452             mark_server_socket_tainted(csp);
3453 #ifdef FEATURE_HTTPS_INSPECTION
3454             close_client_and_server_ssl_connections(csp);
3455 #endif
3456             return;
3457 #endif /* def _WIN32 */
3458          }
3459 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
3460
3461 #ifdef FEATURE_HTTPS_INSPECTION
3462          /*
3463           * Reading data from standard or secured connection (HTTP/HTTPS)
3464           */
3465          if (server_use_ssl(csp))
3466          {
3467             len = ssl_recv_data(&(csp->ssl_server_attr),
3468                (unsigned char *)csp->receive_buffer, csp->receive_buffer_size);
3469          }
3470          else
3471 #endif
3472          {
3473             len = read_socket(csp->server_connection.sfd, csp->receive_buffer,
3474                (int)csp->receive_buffer_size);
3475          }
3476
3477          if (len < 0)
3478          {
3479             log_error(LOG_LEVEL_ERROR, "read from: %s failed: %E", http->host);
3480
3481             if ((http->ssl && (csp->fwd == NULL))
3482 #ifdef FEATURE_HTTPS_INSPECTION
3483                && use_ssl_tunnel
3484 #endif
3485                 )
3486             {
3487                /*
3488                 * Just hang up. We already confirmed the client's CONNECT
3489                 * request with status code 200 and unencrypted content is
3490                 * no longer welcome.
3491                 */
3492                log_error(LOG_LEVEL_ERROR,
3493                   "CONNECT already confirmed. Unable to tell the client about the problem.");
3494                return;
3495             }
3496             else if (byte_count)
3497             {
3498                /*
3499                 * Just hang up. We already transmitted the original headers
3500                 * and parts of the original content and therefore missed the
3501                 * chance to send an error message (without risking data corruption).
3502                 *
3503                 * XXX: we could retry with a fancy range request here.
3504                 */
3505                log_error(LOG_LEVEL_ERROR, "Already forwarded the original headers. "
3506                   "Unable to tell the client about the problem.");
3507                mark_server_socket_tainted(csp);
3508 #ifdef FEATURE_HTTPS_INSPECTION
3509                close_client_and_server_ssl_connections(csp);
3510 #endif
3511                return;
3512             }
3513             /*
3514              * XXX: Consider handling the cases above the same.
3515              */
3516             mark_server_socket_tainted(csp);
3517             len = 0;
3518          }
3519
3520 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
3521          if (csp->flags & CSP_FLAG_CHUNKED)
3522          {
3523             if ((len >= 5) && !memcmp(csp->receive_buffer+len-5, "0\r\n\r\n", 5))
3524             {
3525                /* XXX: this is a temporary hack */
3526                log_error(LOG_LEVEL_CONNECT,
3527                   "Looks like we reached the end of the last chunk. "
3528                   "We better stop reading.");
3529                csp->expected_content_length = byte_count + (unsigned long long)len;
3530                csp->flags |= CSP_FLAG_CONTENT_LENGTH_SET;
3531             }
3532          }
3533          reading_done:
3534 #endif  /* FEATURE_CONNECTION_KEEP_ALIVE */
3535
3536          /*
3537           * This is guaranteed by allocating with zalloc_or_die()
3538           * and never (intentionally) writing to the last byte.
3539           *
3540           * csp->receive_buffer_size is the size of the part of the
3541           * buffer we intentionally write to, but we actually
3542           * allocated csp->receive_buffer_size+1 bytes so the assertion
3543           * stays within the allocated range.
3544           */
3545          assert(csp->receive_buffer[csp->receive_buffer_size] == '\0');
3546
3547          /*
3548           * Add a trailing zero to let be able to use string operations.
3549           * XXX: do we still need this with filter_popups gone?
3550           */
3551          assert(len <= csp->receive_buffer_size);
3552          csp->receive_buffer[len] = '\0';
3553
3554          /*
3555           * Normally, this would indicate that we've read
3556           * as much as the server has sent us and we can
3557           * close the client connection.  However, Microsoft
3558           * in its wisdom has released IIS/5 with a bug that
3559           * prevents it from sending the trailing \r\n in
3560           * a 302 redirect header (and possibly other headers).
3561           * To work around this if we've haven't parsed
3562           * a full header we'll append a trailing \r\n
3563           * and see if this now generates a valid one.
3564           *
3565           * This hack shouldn't have any impacts.  If we've
3566           * already transmitted the header or if this is a
3567           * SSL connection, then we won't bother with this
3568           * hack.  So we only work on partially received
3569           * headers.  If we append a \r\n and this still
3570           * doesn't generate a valid header, then we won't
3571           * transmit anything to the client.
3572           */
3573          if (len == 0)
3574          {
3575
3576             if (server_body || (http->ssl
3577 #ifdef FEATURE_HTTPS_INSPECTION
3578                   && use_ssl_tunnel
3579 #endif
3580                ))
3581             {
3582                /*
3583                 * If we have been buffering up the document,
3584                 * now is the time to apply content modification
3585                 * and send the result to the client.
3586                 */
3587                if (buffer_and_filter_content)
3588                {
3589                   p = execute_content_filters(csp);
3590                   /*
3591                    * If content filtering fails, use the original
3592                    * buffer and length.
3593                    * (see p != NULL ? p : csp->iob->cur below)
3594                    */
3595                   if (NULL == p)
3596                   {
3597                      csp->content_length = (size_t)(csp->iob->eod - csp->iob->cur);
3598                   }
3599 #ifdef FEATURE_COMPRESSION
3600                   else if ((csp->flags & CSP_FLAG_CLIENT_SUPPORTS_DEFLATE)
3601                      && (csp->content_length > LOWER_LENGTH_LIMIT_FOR_COMPRESSION))
3602                   {
3603                      char *compressed_content = compress_buffer(p,
3604                         (size_t *)&csp->content_length, csp->config->compression_level);
3605                      if (compressed_content != NULL)
3606                      {
3607                         freez(p);
3608                         p = compressed_content;
3609                         csp->flags |= CSP_FLAG_BUFFERED_CONTENT_DEFLATED;
3610                      }
3611                   }
3612 #endif
3613
3614                   if (JB_ERR_OK != update_server_headers(csp))
3615                   {
3616                      log_error(LOG_LEVEL_FATAL,
3617                         "Failed to update server headers. after filtering.");
3618                   }
3619
3620                   hdr = list_to_text(csp->headers);
3621                   if (hdr == NULL)
3622                   {
3623                      /* FIXME Should handle error properly */
3624                      log_error(LOG_LEVEL_FATAL, "Out of memory parsing server header");
3625                   }
3626
3627 #ifdef FEATURE_HTTPS_INSPECTION
3628                   /*
3629                    * Sending data with standard or secured connection (HTTP/HTTPS)
3630                    */
3631                   if (client_use_ssl(csp))
3632                   {
3633                      if ((ssl_send_data_delayed(&(csp->ssl_client_attr),
3634                               (const unsigned char *)hdr, strlen(hdr),
3635                               get_write_delay(csp)) < 0)
3636                         || (ssl_send_data_delayed(&(csp->ssl_client_attr),
3637                               (const unsigned char *) ((p != NULL) ? p : csp->iob->cur),
3638                               csp->content_length, get_write_delay(csp)) < 0))
3639                      {
3640                         log_error(LOG_LEVEL_ERROR,
3641                            "Failed to send the modified content to the client over TLS");
3642                         freez(hdr);
3643                         freez(p);
3644                         mark_server_socket_tainted(csp);
3645                         close_client_and_server_ssl_connections(csp);
3646                         return;
3647                      }
3648                   }
3649                   else
3650 #endif /* def FEATURE_HTTPS_INSPECTION */
3651                   {
3652                      if (write_socket_delayed(csp->cfd, hdr, strlen(hdr), write_delay)
3653                       || write_socket_delayed(csp->cfd, ((p != NULL) ? p : csp->iob->cur),
3654                          (size_t)csp->content_length, write_delay))
3655                      {
3656                         log_error(LOG_LEVEL_ERROR, "write modified content to client failed: %E");
3657                         freez(hdr);
3658                         freez(p);
3659                         mark_server_socket_tainted(csp);
3660                         return;
3661                      }
3662                   }
3663
3664                   freez(hdr);
3665                   freez(p);
3666                }
3667
3668                break; /* "game over, man" */
3669             }
3670
3671             /*
3672              * This is not the body, so let's pretend the server just sent
3673              * us a blank line.
3674              */
3675             snprintf(csp->receive_buffer, csp->receive_buffer_size, "\r\n");
3676             len = (int)strlen(csp->receive_buffer);
3677
3678             /*
3679              * Now, let the normal header parsing algorithm below do its
3680              * job.  If it fails, we'll exit instead of continuing.
3681              */
3682
3683             ms_iis5_hack = 1;
3684          }
3685
3686          /*
3687           * If we're in the body of the server document, just write it to
3688           * the client, unless we need to buffer the body for later
3689           * content-filtering.
3690           */
3691          if (server_body || (http->ssl
3692 #ifdef FEATURE_HTTPS_INSPECTION
3693                && use_ssl_tunnel
3694 #endif
3695             ))
3696          {
3697             if (buffer_and_filter_content)
3698             {
3699                /*
3700                 * If there is no memory left for buffering the content, or the buffer limit
3701                 * has been reached, switch to non-filtering mode, i.e. make & write the
3702                 * header, flush the iob and buf, and get out of the way.
3703                 */
3704                if (add_to_iob(csp->iob, csp->config->buffer_limit, csp->receive_buffer, len))
3705                {
3706                   size_t hdrlen;
3707                   long flushed;
3708
3709                   log_error(LOG_LEVEL_INFO,
3710                      "Flushing header and buffers. Stepping back from filtering.");
3711
3712                   hdr = list_to_text(csp->headers);
3713                   if (hdr == NULL)
3714                   {
3715                      /*
3716                       * Memory is too tight to even generate the header.
3717                       * Send our static "Out-of-memory" page.
3718                       */
3719                      log_error(LOG_LEVEL_ERROR, "Out of memory while trying to flush.");
3720                      rsp = cgi_error_memory();
3721                      send_crunch_response(csp, rsp);
3722                      mark_server_socket_tainted(csp);
3723 #ifdef FEATURE_HTTPS_INSPECTION
3724                      close_client_and_server_ssl_connections(csp);
3725 #endif
3726                      return;
3727                   }
3728                   hdrlen = strlen(hdr);
3729
3730 #ifdef FEATURE_HTTPS_INSPECTION
3731                   /*
3732                    * Sending data with standard or secured connection (HTTP/HTTPS)
3733                    */
3734                   if (client_use_ssl(csp))
3735                   {
3736                      if ((ssl_send_data_delayed(&(csp->ssl_client_attr),
3737                              (const unsigned char *)hdr, hdrlen, get_write_delay(csp)) < 0)
3738                         || ((flushed = ssl_flush_socket(&(csp->ssl_client_attr),
3739                                 csp->iob)) < 0)
3740                         || (ssl_send_data_delayed(&(csp->ssl_client_attr),
3741                               (const unsigned char *)csp->receive_buffer, (size_t)len,
3742                               get_write_delay(csp)) < 0))
3743                      {
3744                         log_error(LOG_LEVEL_CONNECT,
3745                            "Flush header and buffers to client failed");
3746                         freez(hdr);
3747                         mark_server_socket_tainted(csp);
3748                         close_client_and_server_ssl_connections(csp);
3749                         return;
3750                      }
3751                   }
3752                   else
3753 #endif /* def FEATURE_HTTPS_INSPECTION */
3754                   {
3755                      if (write_socket_delayed(csp->cfd, hdr, hdrlen, write_delay)
3756                       || ((flushed = flush_iob(csp->cfd, csp->iob, write_delay)) < 0)
3757                       || write_socket_delayed(csp->cfd, csp->receive_buffer, (size_t)len,
3758                             write_delay))
3759                      {
3760                         log_error(LOG_LEVEL_CONNECT,
3761                            "Flush header and buffers to client failed: %E");
3762                         freez(hdr);
3763                         mark_server_socket_tainted(csp);
3764                         return;
3765                      }
3766                   }
3767
3768                   /*
3769                    * Reset the byte_count to the amount of bytes
3770                    * we just flushed. len will be added a few lines below,
3771                    * hdrlen doesn't matter for LOG_LEVEL_CLF.
3772                    */
3773                   byte_count = (unsigned long long)flushed;
3774                   freez(hdr);
3775                   buffer_and_filter_content = 0;
3776                   server_body = 1;
3777                }
3778             }
3779             else
3780             {
3781 #ifdef FEATURE_HTTPS_INSPECTION
3782                /*
3783                 * Sending data with standard or secured connection (HTTP/HTTPS)
3784                 */
3785                if (client_use_ssl(csp))
3786                {
3787                   ret = ssl_send_data_delayed(&(csp->ssl_client_attr),
3788                      (const unsigned char *)csp->receive_buffer, (size_t)len,
3789                      get_write_delay(csp));
3790                   if (ret < 0)
3791                   {
3792                      log_error(LOG_LEVEL_ERROR,
3793                         "Sending data to client failed");
3794                      mark_server_socket_tainted(csp);
3795                      close_client_and_server_ssl_connections(csp);
3796                      return;
3797                   }
3798                }
3799                else
3800 #endif /* def FEATURE_HTTPS_INSPECTION */
3801                {
3802                   if (write_socket_delayed(csp->cfd, csp->receive_buffer,
3803                         (size_t)len, write_delay))
3804                   {
3805                      log_error(LOG_LEVEL_ERROR, "write to client failed: %E");
3806                      mark_server_socket_tainted(csp);
3807                      return;
3808                   }
3809                }
3810             }
3811             byte_count += (unsigned long long)len;
3812             continue;
3813          }
3814          else
3815          {
3816             /*
3817              * We're still looking for the end of the server's header.
3818              * Buffer up the data we just read.  If that fails, there's
3819              * little we can do but send our static out-of-memory page.
3820              */
3821             if (add_to_iob(csp->iob, csp->config->buffer_limit, csp->receive_buffer, len))
3822             {
3823                log_error(LOG_LEVEL_ERROR, "Out of memory while looking for end of server headers.");
3824                rsp = cgi_error_memory();
3825                send_crunch_response(csp, rsp);
3826                mark_server_socket_tainted(csp);
3827 #ifdef FEATURE_HTTPS_INSPECTION
3828                close_client_and_server_ssl_connections(csp);
3829 #endif
3830                return;
3831             }
3832
3833             /* Convert iob into something sed() can digest */
3834             if (JB_ERR_PARSE == get_server_headers(csp))
3835             {
3836                if (ms_iis5_hack)
3837                {
3838                   /*
3839                    * Well, we tried our MS IIS/5 hack and it didn't work.
3840                    * The header is incomplete and there isn't anything
3841                    * we can do about it.
3842                    */
3843                   log_error(LOG_LEVEL_ERROR, "Invalid server headers. "
3844                      "Applying the MS IIS5 hack didn't help.");
3845                   log_error(LOG_LEVEL_CLF,
3846                      "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3847 #ifdef FEATURE_HTTPS_INSPECTION
3848                   /*
3849                    * Sending data with standard or secured connection (HTTP/HTTPS)
3850                    */
3851                   if (client_use_ssl(csp))
3852                   {
3853                      ssl_send_data_delayed(&(csp->ssl_client_attr),
3854                         (const unsigned char *)INVALID_SERVER_HEADERS_RESPONSE,
3855                         strlen(INVALID_SERVER_HEADERS_RESPONSE), get_write_delay(csp));
3856                   }
3857                   else
3858 #endif /* def FEATURE_HTTPS_INSPECTION */
3859                   {
3860                      write_socket_delayed(csp->cfd,
3861                         INVALID_SERVER_HEADERS_RESPONSE,
3862                         strlen(INVALID_SERVER_HEADERS_RESPONSE), write_delay);
3863                   }
3864                   mark_server_socket_tainted(csp);
3865 #ifdef FEATURE_HTTPS_INSPECTION
3866                   close_client_and_server_ssl_connections(csp);
3867 #endif
3868                   return;
3869                }
3870                else
3871                {
3872                   /*
3873                    * Since we have to wait for more from the server before
3874                    * we can parse the headers we just continue here.
3875                    */
3876                   log_error(LOG_LEVEL_CONNECT,
3877                      "Continuing buffering server headers from socket %d. "
3878                      "Bytes most recently read: %ld.", csp->cfd, len);
3879                   continue;
3880                }
3881             }
3882             else
3883             {
3884                /*
3885                 * Account for the content bytes we
3886                 * might have gotten with the headers.
3887                 */
3888                assert(csp->iob->eod >= csp->iob->cur);
3889                byte_count = (unsigned long long)(csp->iob->eod - csp->iob->cur);
3890             }
3891
3892             /* Did we actually get anything? */
3893             if (NULL == csp->headers->first)
3894             {
3895                if ((csp->flags & CSP_FLAG_REUSED_CLIENT_CONNECTION))
3896                {
3897                   log_error(LOG_LEVEL_ERROR,
3898                      "No server or forwarder response received on socket %d. "
3899                      "Closing client socket %d without sending data.",
3900                      csp->server_connection.sfd, csp->cfd);
3901                   log_error(LOG_LEVEL_CLF,
3902                      "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3903                }
3904                else
3905                {
3906                   log_error(LOG_LEVEL_ERROR,
3907                      "No server or forwarder response received on socket %d.",
3908                      csp->server_connection.sfd);
3909                   send_crunch_response(csp, error_response(csp, "no-server-data"));
3910                }
3911                free_http_request(http);
3912                mark_server_socket_tainted(csp);
3913 #ifdef FEATURE_HTTPS_INSPECTION
3914                close_client_and_server_ssl_connections(csp);
3915 #endif
3916                return;
3917             }
3918
3919             if (!csp->headers->first->str)
3920             {
3921                log_error(LOG_LEVEL_ERROR, "header search: csp->headers->first->str == NULL, assert will be called");
3922             }
3923             assert(csp->headers->first->str);
3924
3925             if (strncmpic(csp->headers->first->str, "HTTP", 4) &&
3926                 strncmpic(csp->headers->first->str, "ICY", 3))
3927             {
3928                /*
3929                 * It doesn't look like a HTTP (or Shoutcast) response:
3930                 * tell the client and log the problem.
3931                 */
3932                if (strlen(csp->headers->first->str) > 30)
3933                {
3934                   csp->headers->first->str[30] = '\0';
3935                }
3936                log_error(LOG_LEVEL_ERROR,
3937                   "Invalid server or forwarder response. Starts with: %s",
3938                   csp->headers->first->str);
3939                log_error(LOG_LEVEL_CLF,
3940                   "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3941 #ifdef FEATURE_HTTPS_INSPECTION
3942                /*
3943                 * Sending data with standard or secured connection (HTTP/HTTPS)
3944                 */
3945                if (client_use_ssl(csp))
3946                {
3947                   ssl_send_data_delayed(&(csp->ssl_client_attr),
3948                      (const unsigned char *)INVALID_SERVER_HEADERS_RESPONSE,
3949                      strlen(INVALID_SERVER_HEADERS_RESPONSE),
3950                      get_write_delay(csp));
3951                }
3952                else
3953 #endif /* def FEATURE_HTTPS_INSPECTION */
3954                {
3955                   write_socket_delayed(csp->cfd, INVALID_SERVER_HEADERS_RESPONSE,
3956                      strlen(INVALID_SERVER_HEADERS_RESPONSE), write_delay);
3957                }
3958                free_http_request(http);
3959                mark_server_socket_tainted(csp);
3960 #ifdef FEATURE_HTTPS_INSPECTION
3961                close_client_and_server_ssl_connections(csp);
3962 #endif
3963                return;
3964             }
3965
3966             /*
3967              * Disable redirect checkers, so that they will be only run
3968              * again if the user also enables them through tags.
3969              *
3970              * From a performance point of view it doesn't matter,
3971              * but it prevents duplicated log messages.
3972              */
3973 #ifdef FEATURE_FAST_REDIRECTS
3974             csp->action->flags &= ~ACTION_FAST_REDIRECTS;
3975 #endif
3976             csp->action->flags &= ~ACTION_REDIRECT;
3977
3978             /*
3979              * We have now received the entire server header,
3980              * filter it and send the result to the client
3981              */
3982             if (JB_ERR_OK != sed(csp, FILTER_SERVER_HEADERS))
3983             {
3984                log_error(LOG_LEVEL_CLF,
3985                   "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
3986 #ifdef FEATURE_HTTPS_INSPECTION
3987                /*
3988                 * Sending data with standard or secured connection (HTTP/HTTPS)
3989                 */
3990                if (client_use_ssl(csp))
3991                {
3992                   ssl_send_data_delayed(&(csp->ssl_client_attr),
3993                      (const unsigned char *)INVALID_SERVER_HEADERS_RESPONSE,
3994                      strlen(INVALID_SERVER_HEADERS_RESPONSE),
3995                      get_write_delay(csp));
3996                }
3997                else
3998 #endif
3999                {
4000                   write_socket_delayed(csp->cfd, INVALID_SERVER_HEADERS_RESPONSE,
4001                      strlen(INVALID_SERVER_HEADERS_RESPONSE), write_delay);
4002                }
4003                free_http_request(http);
4004                mark_server_socket_tainted(csp);
4005 #ifdef FEATURE_HTTPS_INSPECTION
4006                close_client_and_server_ssl_connections(csp);
4007 #endif
4008                return;
4009             }
4010             hdr = list_to_text(csp->headers);
4011             if (hdr == NULL)
4012             {
4013                /* FIXME Should handle error properly */
4014                log_error(LOG_LEVEL_FATAL, "Out of memory parsing server header");
4015             }
4016
4017             if ((csp->flags & CSP_FLAG_CHUNKED)
4018                && !(csp->flags & CSP_FLAG_CONTENT_LENGTH_SET)
4019                && ((csp->iob->eod - csp->iob->cur) >= 5)
4020                && !memcmp(csp->iob->eod-5, "0\r\n\r\n", 5))
4021             {
4022                log_error(LOG_LEVEL_CONNECT,
4023                   "Looks like we got the last chunk together with "
4024                   "the server headers. We better stop reading.");
4025                byte_count = (unsigned long long)(csp->iob->eod - csp->iob->cur);
4026                csp->expected_content_length = byte_count;
4027                csp->flags |= CSP_FLAG_CONTENT_LENGTH_SET;
4028             }
4029
4030             csp->server_connection.response_received = time(NULL);
4031
4032             if (crunch_response_triggered(csp, crunchers_light))
4033             {
4034                /*
4035                 * One of the tags created by a server-header
4036                 * tagger triggered a crunch. We already
4037                 * delivered the crunch response to the client
4038                 * and are done here after cleaning up.
4039                 */
4040                freez(hdr);
4041                mark_server_socket_tainted(csp);
4042 #ifdef FEATURE_HTTPS_INSPECTION
4043                close_client_and_server_ssl_connections(csp);
4044 #endif
4045                return;
4046             }
4047
4048             /* Buffer and pcrs filter this if appropriate. */
4049             buffer_and_filter_content = content_requires_filtering(csp);
4050
4051             if (!buffer_and_filter_content)
4052             {
4053                /*
4054                 * Write the server's (modified) header to
4055                 * the client (along with anything else that
4056                 * may be in the buffer). Use standard or secured
4057                 * connection.
4058                 */
4059 #ifdef FEATURE_HTTPS_INSPECTION
4060                if (client_use_ssl(csp))
4061                {
4062                   if ((ssl_send_data_delayed(&(csp->ssl_client_attr),
4063                           (const unsigned char *)hdr, strlen(hdr),
4064                           get_write_delay(csp)) < 0)
4065                      || ((len = ssl_flush_socket(&(csp->ssl_client_attr),
4066                             csp->iob)) < 0))
4067                   {
4068                      log_error(LOG_LEVEL_CONNECT, "Write header to client failed");
4069
4070                      /*
4071                       * The write failed, so don't bother mentioning it
4072                       * to the client... it probably can't hear us anyway.
4073                       */
4074                      freez(hdr);
4075                      mark_server_socket_tainted(csp);
4076 #ifdef FEATURE_HTTPS_INSPECTION
4077                      close_client_and_server_ssl_connections(csp);
4078 #endif
4079                      return;
4080                   }
4081                }
4082                else
4083 #endif /* def FEATURE_HTTPS_INSPECTION */
4084                {
4085                   if (write_socket_delayed(csp->cfd, hdr, strlen(hdr), write_delay)
4086                      || ((len = flush_iob(csp->cfd, csp->iob, write_delay)) < 0))
4087                   {
4088                      log_error(LOG_LEVEL_ERROR,
4089                         "write header to client failed");
4090                      /*
4091                       * The write failed, so don't bother mentioning it
4092                       * to the client... it probably can't hear us anyway.
4093                       */
4094                      freez(hdr);
4095                      mark_server_socket_tainted(csp);
4096                      return;
4097                   }
4098                }
4099                                 }
4100
4101             /* we're finished with the server's header */
4102
4103             freez(hdr);
4104             server_body = 1;
4105
4106             /*
4107              * If this was a MS IIS/5 hack then it means the server
4108              * has already closed the connection. Nothing more to read.
4109              * Time to bail.
4110              */
4111             if (ms_iis5_hack)
4112             {
4113                log_error(LOG_LEVEL_ERROR,
4114                   "Closed server connection detected. "
4115                   "Applying the MS IIS5 hack didn't help.");
4116                log_error(LOG_LEVEL_CLF,
4117                   "%s - - [%T] \"%s\" 502 0", csp->ip_addr_str, http->cmd);
4118 #ifdef FEATURE_HTTPS_INSPECTION
4119                /*
4120                 * Sending data with standard or secured connection (HTTP/HTTPS)
4121                 */
4122                if (client_use_ssl(csp))
4123                {
4124                   ssl_send_data_delayed(&(csp->ssl_client_attr),
4125                      (const unsigned char *)INVALID_SERVER_HEADERS_RESPONSE,
4126                      strlen(INVALID_SERVER_HEADERS_RESPONSE),
4127                      get_write_delay(csp));
4128                }
4129                else
4130 #endif /* def FEATURE_HTTPS_INSPECTION */
4131                {
4132                   write_socket_delayed(csp->cfd, INVALID_SERVER_HEADERS_RESPONSE,
4133                      strlen(INVALID_SERVER_HEADERS_RESPONSE), write_delay);
4134                }
4135                mark_server_socket_tainted(csp);
4136 #ifdef FEATURE_HTTPS_INSPECTION
4137                close_client_and_server_ssl_connections(csp);
4138 #endif
4139                return;
4140             }
4141          }
4142          continue;
4143       }
4144       mark_server_socket_tainted(csp);
4145 #ifdef FEATURE_HTTPS_INSPECTION
4146       close_client_and_server_ssl_connections(csp);
4147 #endif
4148       return; /* huh? we should never get here */
4149    }
4150
4151    if (csp->content_length == 0)
4152    {
4153       /*
4154        * If Privoxy didn't recalculate the Content-Length,
4155        * byte_count is still correct.
4156        */
4157       csp->content_length = byte_count;
4158    }
4159
4160 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
4161    if ((csp->flags & CSP_FLAG_CONTENT_LENGTH_SET)
4162       && (csp->expected_content_length != byte_count))
4163    {
4164       log_error(LOG_LEVEL_CONNECT,
4165          "Received %llu bytes while expecting %llu.",
4166          byte_count, csp->expected_content_length);
4167       mark_server_socket_tainted(csp);
4168    }
4169 #endif
4170
4171 #ifdef FEATURE_HTTPS_INSPECTION
4172    if (client_use_ssl(csp))
4173    {
4174       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s https://%s%s %s\" 200 %llu",
4175          csp->ip_addr_str, http->gpc, http->hostport, http->path,
4176          http->version, csp->content_length);
4177    }
4178    else
4179 #endif
4180    {
4181       log_error(LOG_LEVEL_CLF, "%s - - [%T] \"%s\" 200 %llu",
4182          csp->ip_addr_str, http->ocmd, csp->content_length);
4183    }
4184    csp->server_connection.timestamp = time(NULL);
4185 }
4186
4187
4188 /*********************************************************************
4189  *
4190  * Function    :  chat
4191  *
4192  * Description :  Once a connection from the client has been accepted,
4193  *                this function is called (via serve()) to handle the
4194  *                main business of the communication.  This function
4195  *                returns after dealing with a single request. It can
4196  *                be called multiple times with the same client socket
4197  *                if the client is keeping the connection alive.
4198  *
4199  *                The decision whether or not a client connection will
4200  *                be kept alive is up to the caller which also must
4201  *                close the client socket when done.
4202  *
4203  *                FIXME: chat is nearly a thousand lines long.
4204  *                Ridiculous.
4205  *
4206  * Parameters  :
4207  *          1  :  csp = Current client state (buffers, headers, etc...)
4208  *
4209  * Returns     :  Nothing.
4210  *
4211  *********************************************************************/
4212 static void chat(struct client_state *csp)
4213 {
4214    const struct forward_spec *fwd;
4215    struct http_request *http;
4216    /* Skeleton for HTTP response, if we should intercept the request */
4217    struct http_response *rsp;
4218 #ifdef FEATURE_HTTPS_INSPECTION
4219    int use_ssl_tunnel = 0;
4220 #endif
4221
4222    http = csp->http;
4223
4224    if (receive_client_request(csp) != JB_ERR_OK)
4225    {
4226       return;
4227    }
4228
4229 #if defined(FEATURE_STATISTICS) && defined(MUTEX_LOCKS_AVAILABLE)
4230    privoxy_mutex_lock(&block_statistics_mutex);
4231    number_of_requests_received++;
4232    privoxy_mutex_unlock(&block_statistics_mutex);
4233 #endif
4234
4235    if (parse_client_request(csp) != JB_ERR_OK)
4236    {
4237       return;
4238    }
4239
4240 #ifdef FEATURE_HTTPS_INSPECTION
4241    /*
4242     * Setting flags to use old solution with SSL tunnel and to disable
4243     * certificate verification.
4244     */
4245    if (csp->http->ssl && !(csp->action->flags & ACTION_HTTPS_INSPECTION)
4246       && !cgi_page_requested(csp->http->host))
4247    {
4248       use_ssl_tunnel = 1;
4249    }
4250
4251    if (http->ssl && (csp->action->flags & ACTION_IGNORE_CERTIFICATE_ERRORS))
4252    {
4253       csp->dont_verify_certificate = 1;
4254    }
4255 #endif
4256
4257    /*
4258     * build the http request to send to the server
4259     * we have to do one of the following:
4260     *
4261     * create =    use the original HTTP request to create a new
4262     *             HTTP request that has either the path component
4263     *             without the http://domainspec (w/path) or the
4264     *             full original URL (w/url)
4265     *             Note that the path and/or the HTTP version may
4266     *             have been altered by now.
4267     *
4268     * SSL proxy = Open a socket to the host:port of the server
4269     *             and create TLS/SSL connection with server and
4270     *             with client. Then behave like mediator between
4271     *             client and server over TLS/SSL.
4272     *
4273     * SSL proxy = Pass the request unchanged if forwarding a CONNECT
4274     *    with     request to a parent proxy. Note that we'll be sending
4275     * forwarding  the CFAIL message ourselves if connecting to the parent
4276     *             fails, but we won't send a CSUCCEED message if it works,
4277     *             since that would result in a double message (ours and the
4278     *             parent's). After sending the request to the parent, we
4279     *             must parse answer and send it to client. If connection
4280     *             with server is established, we do TLS/SSL proxy. Otherwise
4281     *             we send parent response to client and close connections.
4282     *
4283     * here's the matrix:
4284     *                        SSL
4285     *                    0        1
4286     *                +--------+--------+
4287     *                |        |        |
4288     *             0  | create |   SSL  |
4289     *                | w/path |  proxy |
4290     *  Forwarding    +--------+--------+
4291     *                |        |   SSL  |
4292     *             1  | create |  proxy |
4293     *                | w/url  |+forward|
4294     *                +--------+--------+
4295     *
4296     */
4297
4298 #ifdef FEATURE_HTTPS_INSPECTION
4299    /*
4300     * Presetting SSL client and server flags
4301     */
4302    if (http->ssl && !use_ssl_tunnel)
4303    {
4304       http->client_ssl = 1;
4305       http->server_ssl = 1;
4306    }
4307    else
4308    {
4309       http->client_ssl = 0;
4310       http->server_ssl = 0;
4311    }
4312 #endif
4313
4314 #ifdef FEATURE_HTTPS_INSPECTION
4315    /*
4316     * Log the request unless we're https inspecting
4317     * in which case we don't have the path yet and
4318     * will log the request later.
4319     */
4320    if (!client_use_ssl(csp))
4321 #endif
4322    {
4323       log_error(LOG_LEVEL_REQUEST, "%s%s", http->hostport, http->path);
4324    }
4325
4326    if (http->ssl && connect_port_is_forbidden(csp))
4327    {
4328       const char *acceptable_connect_ports =
4329          csp->action->string[ACTION_STRING_LIMIT_CONNECT];
4330       assert(NULL != acceptable_connect_ports);
4331       log_error(LOG_LEVEL_INFO, "Request from %s marked for blocking. "
4332          "limit-connect{%s} doesn't allow CONNECT requests to %s",
4333          csp->ip_addr_str, acceptable_connect_ports, csp->http->hostport);
4334       csp->action->flags |= ACTION_BLOCK;
4335       http->ssl = 0;
4336 #ifdef FEATURE_HTTPS_INSPECTION
4337       http->client_ssl = 0;
4338       http->server_ssl = 0;
4339 #endif
4340    }
4341
4342    /*
4343     * We have a request. Check if one of the crunchers wants it
4344     * unless the client wants to use TLS/SSL in which case we
4345     * haven't setup the TLS context yet and will send the crunch
4346     * response later.
4347     */
4348    if (
4349 #ifdef FEATURE_HTTPS_INSPECTION
4350        !client_use_ssl(csp) &&
4351 #endif
4352        crunch_response_triggered(csp, crunchers_all))
4353    {
4354       /*
4355        * Yes. The client got the crunch response and we're done here.
4356        */
4357       return;
4358    }
4359
4360 #ifdef FEATURE_HTTPS_INSPECTION
4361    if (client_use_ssl(csp) && !use_ssl_tunnel)
4362    {
4363       int ret;
4364       /*
4365        * Creating an SSL proxy.
4366        *
4367        * By sending the CSUCCEED message we're lying to the client as
4368        * the connection hasn't actually been established yet. We don't
4369        * establish the connection until we have seen and parsed the
4370        * encrypted client headers.
4371        */
4372       if (write_socket_delayed(csp->cfd, CSUCCEED,
4373             strlen(CSUCCEED), get_write_delay(csp)) != 0)
4374       {
4375          log_error(LOG_LEVEL_ERROR, "Sending SUCCEED to client failed");
4376          return;
4377       }
4378
4379       ret = create_client_ssl_connection(csp);
4380       if (ret != 0)
4381       {
4382          log_error(LOG_LEVEL_ERROR,
4383             "Failed to open a secure connection with the client");
4384          return;
4385       }
4386       if (JB_ERR_OK != process_encrypted_request_headers(csp))
4387       {
4388          close_client_ssl_connection(csp);
4389          return;
4390       }
4391       /*
4392        * We have an encrypted request. Check if one of the crunchers now
4393        * wants it (for example because the previously invisible path was
4394        * required to match).
4395        */
4396       if (crunch_response_triggered(csp, crunchers_all))
4397       {
4398          /*
4399           * Yes. The client got the crunch response and we're done here.
4400           */
4401          return;
4402       }
4403    }
4404 #endif
4405
4406    log_applied_actions(csp->action);
4407
4408    /* decide how to route the HTTP request */
4409    fwd = forward_url(csp, http);
4410
4411    freez(csp->headers->first->str);
4412    build_request_line(csp, fwd, &csp->headers->first->str);
4413
4414    if (fwd->forward_host)
4415    {
4416       log_error(LOG_LEVEL_CONNECT, "via [%s]:%d to: %s",
4417          fwd->forward_host, fwd->forward_port, http->hostport);
4418    }
4419    else
4420    {
4421       log_error(LOG_LEVEL_CONNECT, "to %s", http->hostport);
4422    }
4423
4424    /* here we connect to the server, gateway, or the forwarder */
4425
4426 #ifdef FEATURE_CONNECTION_KEEP_ALIVE
4427    if ((csp->server_connection.sfd != JB_INVALID_SOCKET)
4428       && socket_is_still_alive(csp->server_connection.sfd)
4429       && connection_destination_matches(&csp->server_connection, http, fwd))
4430    {
4431       log_error(LOG_LEVEL_CONNECT,
4432          "Reusing server socket %d connected to %s. Total requests: %u.",
4433          csp->server_connection.sfd, csp->server_connection.host,
4434          csp->server_connection.requests_sent_total);
4435    }
4436    else
4437    {
4438       if (csp->server_connection.sfd != JB_INVALID_SOCKET)
4439       {
4440 #ifdef FEATURE_CONNECTION_SHARING
4441          if (csp->config->feature_flags & RUNTIME_FEATURE_CONNECTION_SHARING
4442 #ifdef FEATURE_HTTPS_INSPECTION
4443             && !server_use_ssl(csp)
4444 #endif
4445             )
4446          {
4447             remember_connection(&csp->server_connection);
4448          }
4449          else
4450 #endif /* def FEATURE_CONNECTION_SHARING */
4451          {
4452             log_error(LOG_LEVEL_CONNECT,
4453                "Closing server socket %d connected to %s. Total requests: %u.",
4454                csp->server_connection.sfd, csp->server_connection.host,
4455                csp->server_connection.requests_sent_total);
4456             close_socket(csp->server_connection.sfd);
4457          }
4458          mark_connection_closed(&csp->server_connection);
4459       }
4460 #endif /* def FEATURE_CONNECTION_KEEP_ALIVE */
4461
4462       /*
4463        * Connecting to destination server
4464        */
4465       csp->server_connection.sfd = forwarded_connect(fwd, http, csp);
4466
4467       if (csp->server_connection.sfd == JB_INVALID_SOCKET)
4468       {
4469          if (fwd->type != SOCKS_NONE)
4470          {
4471             /* Socks error. */
4472             rsp = error_response(csp, "forwarding-failed");
4473          }
4474          else if (errno == EINVAL)
4475          {
4476             rsp = error_response(csp, "no-such-domain");
4477          }
4478          else
4479          {
4480             rsp = error_response(csp, "connect-failed");
4481          }
4482
4483          /* Write the answer to the client */
4484          if (rsp != NULL)
4485          {
4486             send_crunch_response(csp, rsp);
4487          }
4488
4489          /*
4490           * Temporary workaround to prevent already-read client
4491           * bodies from being parsed as new requests. For now we
4492           * err on the safe side and throw all the following
4493           * requests under the bus, even if no client body has been
4494           * buffered. A compliant client will repeat the dropped
4495           * requests on an untainted connection.
4496           *
4497           * The proper fix is to discard the no longer needed
4498           * client body in the buffer (if there is one) and to
4499           * continue parsing the bytes that follow.
4500           */
4501 #ifdef FEATURE_HTTPS_INSPECTION
4502          close_client_ssl_connection(csp);
4503 #endif
4504          drain_and_close_socket(csp->cfd);
4505          csp->cfd = JB_INVALID_SOCKET;
4506
4507          return;
4508       }