1 #ifndef PARSERS_H_INCLUDED
2 #define PARSERS_H_INCLUDED
3 #define PARSERS_H_VERSION "$Id: parsers.h,v 1.46 2008/05/21 15:47:14 fabiankeil Exp $"
4 /*********************************************************************
6 * File : $Source: /cvsroot/ijbswa/current/parsers.h,v $
8 * Purpose : Declares functions to parse/crunch headers and pages.
9 * Functions declared include:
10 * `add_to_iob', `client_cookie_adder', `client_from',
11 * `client_referrer', `client_send_cookie', `client_ua',
12 * `client_uagent', `client_x_forwarded',
13 * `client_x_forwarded_adder', `client_xtra_adder',
14 * `content_type', `crumble', `destroy_list', `enlist',
15 * `flush_socket', `free_http_request', `get_header',
16 * `list_to_text', `parse_http_request', `sed',
17 * and `server_set_cookie'.
19 * Copyright : Written by and Copyright (C) 2001 the SourceForge
20 * Privoxy team. http://www.privoxy.org/
22 * Based on the Internet Junkbuster originally written
23 * by and Copyright (C) 1997 Anonymous Coders and
24 * Junkbusters Corporation. http://www.junkbusters.com
26 * This program is free software; you can redistribute it
27 * and/or modify it under the terms of the GNU General
28 * Public License as published by the Free Software
29 * Foundation; either version 2 of the License, or (at
30 * your option) any later version.
32 * This program is distributed in the hope that it will
33 * be useful, but WITHOUT ANY WARRANTY; without even the
34 * implied warranty of MERCHANTABILITY or FITNESS FOR A
35 * PARTICULAR PURPOSE. See the GNU General Public
36 * License for more details.
38 * The GNU General Public License should be included with
39 * this file. If not, you can view it at
40 * http://www.gnu.org/copyleft/gpl.html
41 * or write to the Free Software Foundation, Inc., 59
42 * Temple Place - Suite 330, Boston, MA 02111-1307, USA.
46 * Revision 1.46 2008/05/21 15:47:14 fabiankeil
47 * Streamline sed()'s prototype and declare
48 * the header parse and add structures static.
50 * Revision 1.45 2008/05/20 20:13:30 fabiankeil
51 * Factor update_server_headers() out of sed(), ditch the
52 * first_run hack and make server_patterns_light static.
54 * Revision 1.44 2008/05/20 16:05:09 fabiankeil
55 * Move parsers structure definition from project.h to parsers.h.
57 * Revision 1.43 2008/05/10 13:23:38 fabiankeil
58 * Don't provide get_header() with the whole client state
59 * structure when it only needs access to csp->iob.
61 * Revision 1.42 2008/04/17 14:40:49 fabiankeil
62 * Provide get_http_time() with the buffer size so it doesn't
63 * have to blindly assume that the buffer is big enough.
65 * Revision 1.41 2008/04/16 16:38:21 fabiankeil
66 * Don't pass the whole csp structure to flush_socket()
67 * when it only needs a file descriptor and a buffer.
69 * Revision 1.40 2007/08/11 14:47:26 fabiankeil
70 * Remove the prototypes for functions that are only
71 * used in parsers.c and thus should be static.
73 * Revision 1.39 2007/06/01 16:31:55 fabiankeil
74 * Change sed() to return a jb_err in preparation for forward-override{}.
76 * Revision 1.38 2007/03/25 14:27:11 fabiankeil
77 * Let parse_header_time() return a jb_err code
78 * instead of a pointer that can only be used to
79 * check for NULL anyway.
81 * Revision 1.37 2007/03/20 15:22:17 fabiankeil
82 * - Remove filter_client_header() and filter_client_header(),
83 * filter_header() now checks the shiny new
84 * CSP_FLAG_CLIENT_HEADER_PARSING_DONE flag instead.
86 * Revision 1.36 2007/03/05 13:25:32 fabiankeil
87 * - Cosmetical changes for LOG_LEVEL_RE_FILTER messages.
88 * - Handle "Cookie:" and "Connection:" headers a bit smarter
89 * (don't crunch them just to recreate them later on).
90 * - Add another non-standard time format for the cookie
91 * expiration date detection.
92 * - Fix a valgrind warning.
94 * Revision 1.35 2007/01/01 19:36:37 fabiankeil
95 * Integrate a modified version of Wil Mahan's
96 * zlib patch (PR #895531).
98 * Revision 1.34 2006/12/29 19:08:22 fabiankeil
99 * Reverted parts of my last commit
100 * to keep error handling working.
102 * Revision 1.33 2006/12/29 18:04:40 fabiankeil
103 * Fixed gcc43 conversion warnings.
105 * Revision 1.32 2006/12/06 19:14:23 fabiankeil
106 * Added prototype for get_destination_from_headers().
108 * Revision 1.31 2006/08/17 17:15:10 fabiankeil
109 * - Back to timegm() using GnuPG's replacement if necessary.
110 * Using mktime() and localtime() could add a on hour offset if
111 * the randomize factor was big enough to lead to a summer/wintertime
114 * - Removed now-useless Privoxy 3.0.3 compatibility glue.
116 * - Moved randomization code into pick_from_range().
118 * - Changed parse_header_time definition.
119 * time_t isn't guaranteed to be signed and
120 * if it isn't, -1 isn't available as error code.
121 * Changed some variable types in client_if_modified_since()
122 * because of the same reason.
124 * Revision 1.30 2006/08/14 08:25:19 fabiankeil
125 * Split filter-headers{} into filter-client-headers{}
126 * and filter-server-headers{}.
127 * Added parse_header_time() to share some code.
128 * Replaced timegm() with mktime().
130 * Revision 1.29 2006/08/03 02:46:41 david__schmidt
131 * Incorporate Fabian Keil's patch work:
\rhttp://www.fabiankeil.de/sourcecode/privoxy/
133 * Revision 1.28 2006/07/18 14:48:47 david__schmidt
134 * Reorganizing the repository: swapping out what was HEAD (the old 3.1 branch)
135 * with what was really the latest development (the v_3_0_branch branch)
137 * Revision 1.26.2.1 2002/09/25 14:52:46 oes
138 * Added basic support for OPTIONS and TRACE HTTP methods:
139 * - New parser function client_max_forwards which decrements
140 * the Max-Forwards HTTP header field of OPTIONS and TRACE
141 * requests by one before forwarding
142 * - New parser function client_host which extracts the host
143 * and port information from the HTTP header field if the
144 * request URI was not absolute
145 * - Don't crumble and re-add the Host: header, but only generate
146 * and append if missing
148 * Revision 1.26 2002/05/08 15:59:53 oes
149 * Changed add_to_iob signature (now returns jb_err)
151 * Revision 1.25 2002/03/26 22:29:55 swa
152 * we have a new homepage!
154 * Revision 1.24 2002/03/24 13:25:43 swa
155 * name change related issues
157 * Revision 1.23 2002/03/13 00:27:05 jongfoster
160 * Revision 1.22 2002/03/09 20:03:52 jongfoster
161 * - Making various functions return int rather than size_t.
162 * (Undoing a recent change). Since size_t is unsigned on
163 * Windows, functions like read_socket that return -1 on
164 * error cannot return a size_t.
166 * THIS WAS A MAJOR BUG - it caused frequent, unpredictable
167 * crashes, and also frequently caused JB to jump to 100%
168 * CPU and stay there. (Because it thought it had just
169 * read ((unsigned)-1) == 4Gb of data...)
171 * - The signature of write_socket has changed, it now simply
172 * returns success=0/failure=nonzero.
174 * - Trying to get rid of a few warnings --with-debug on
175 * Windows, I've introduced a new type "jb_socket". This is
176 * used for the socket file descriptors. On Windows, this
177 * is SOCKET (a typedef for unsigned). Everywhere else, it's
178 * an int. The error value can't be -1 any more, so it's
179 * now JB_INVALID_SOCKET (which is -1 on UNIX, and in
180 * Windows it maps to the #define INVALID_SOCKET.)
182 * - The signature of bind_port has changed.
184 * Revision 1.21 2002/03/07 03:46:17 oes
185 * Fixed compiler warnings
187 * Revision 1.20 2002/02/20 23:15:13 jongfoster
188 * Parsing functions now handle out-of-memory gracefully by returning
191 * Revision 1.19 2002/01/17 21:03:47 jongfoster
192 * Moving all our URL and URL pattern parsing code to urlmatch.c.
194 * Revision 1.18 2001/10/26 17:40:23 oes
195 * Introduced get_header_value()
196 * Removed client_accept()
198 * Revision 1.17 2001/10/13 12:47:32 joergs
199 * Removed client_host, added client_host_adder
201 * Revision 1.16 2001/10/07 18:50:16 oes
202 * Added server_content_encoding, renamed server_transfer_encoding
204 * Revision 1.15 2001/10/07 18:01:55 oes
205 * Changed server_http11 to server_http
207 * Revision 1.14 2001/10/07 15:45:48 oes
208 * added client_accept_encoding, client_te, client_accept_encoding_adder
210 * renamed content_type and content_length
212 * fixed client_host and strclean prototypes
214 * Revision 1.13 2001/09/29 12:56:03 joergs
215 * IJB now changes HTTP/1.1 to HTTP/1.0 in requests and answers.
217 * Revision 1.12 2001/09/13 23:05:50 jongfoster
218 * Changing the string paramater to the header parsers a "const".
220 * Revision 1.11 2001/07/31 14:46:53 oes
221 * Added prototype for connection_close_adder
223 * Revision 1.10 2001/07/30 22:08:36 jongfoster
224 * Tidying up #defines:
225 * - All feature #defines are now of the form FEATURE_xxx
226 * - Permanently turned off WIN_GUI_EDIT
227 * - Permanently turned on WEBDAV and SPLIT_PROXY_ARGS
229 * Revision 1.9 2001/07/29 18:43:08 jongfoster
230 * Changing #ifdef _FILENAME_H to FILENAME_H_INCLUDED, to conform to
233 * Revision 1.8 2001/07/13 14:01:54 oes
234 * Removed all #ifdef PCRS
236 * Revision 1.7 2001/06/29 13:32:14 oes
237 * Removed logentry from cancelled commit
239 * Revision 1.6 2001/06/03 19:12:38 oes
240 * deleted const struct interceptors
242 * Revision 1.5 2001/05/31 21:30:33 jongfoster
243 * Removed list code - it's now in list.[ch]
244 * Renamed "permission" to "action", and changed many features
245 * to use the actions file rather than the global config.
247 * Revision 1.4 2001/05/27 13:19:06 oes
248 * Patched Joergs solution for the content-length in.
250 * Revision 1.3 2001/05/26 13:39:32 jongfoster
251 * Only crunches Content-Length header if applying RE filtering.
252 * Without this fix, Microsoft Windows Update wouldn't work.
254 * Revision 1.2 2001/05/20 01:21:20 jongfoster
255 * Version 2.9.4 checkin.
256 * - Merged popupfile and cookiefile, and added control over PCRS
257 * filtering, in new "permissionsfile".
258 * - Implemented LOG_LEVEL_FATAL, so that if there is a configuration
259 * file error you now get a message box (in the Win32 GUI) rather
260 * than the program exiting with no explanation.
261 * - Made killpopup use the PCRS MIME-type checking and HTTP-header
263 * - Removed tabs from "config"
264 * - Moved duplicated url parsing code in "loaders.c" to a new funcition.
265 * - Bumped up version number.
267 * Revision 1.1.1.1 2001/05/15 13:59:01 oes
268 * Initial import of version 2.9.3 source tree
271 *********************************************************************/
280 /* Used for sed()'s second argument. */
281 #define FILTER_CLIENT_HEADERS 0
282 #define FILTER_SERVER_HEADERS 1
284 extern int flush_socket(jb_socket fd, struct iob *iob);
285 extern jb_err add_to_iob(struct client_state *csp, char *buf, int n);
286 extern jb_err decompress_iob(struct client_state *csp);
287 extern char *get_header(struct iob *iob);
288 extern char *get_header_value(const struct list *header_list, const char *header_name);
289 extern jb_err sed(struct client_state *csp, int filter_server_headers);
290 extern jb_err update_server_headers(struct client_state *csp);
291 extern void get_http_time(int time_offset, char *buf, size_t buffer_size);
292 extern jb_err get_destination_from_headers(const struct list *headers, struct http_request *http);
294 #ifdef FEATURE_FORCE_LOAD
295 extern int strclean(char *string, const char *substring);
296 #endif /* def FEATURE_FORCE_LOAD */
298 /* Revision control strings from this header and associated .c file */
299 extern const char parsers_rcs[];
300 extern const char parsers_h_rcs[];
308 #endif /* ndef PARSERS_H_INCLUDED */