X-Git-Url: http://www.privoxy.org/gitweb/?p=privoxy.git;a=blobdiff_plain;f=project.h;h=683296844eb7593819c25618f1b8b680560e2ff9;hp=7371d659e6287e45ddbad4988a36db59025506f3;hb=5f4fdef17eb7cb66f186168c8be1433618dc5eb7;hpb=87a69fc505def6be1c8a4d24ae225c3623b5e861 diff --git a/project.h b/project.h index 7371d659..68329684 100644 --- a/project.h +++ b/project.h @@ -1,6 +1,6 @@ #ifndef _PROJECT_H #define _PROJECT_H -#define PROJECT_H_VERSION "$Id: project.h,v 1.2 2001/05/17 23:01:01 oes Exp $" +#define PROJECT_H_VERSION "$Id: project.h,v 1.12 2001/06/01 18:49:17 jongfoster Exp $" /********************************************************************* * * File : $Source: /cvsroot/ijbswa/current/project.h,v $ @@ -36,6 +36,126 @@ * * Revisions : * $Log: project.h,v $ + * Revision 1.12 2001/06/01 18:49:17 jongfoster + * Replaced "list_share" with "list" - the tiny memory gain was not + * worth the extra complexity. + * + * Revision 1.11 2001/06/01 10:32:47 oes + * Added constants for anchoring selection bitmap + * + * Revision 1.10 2001/05/31 21:33:53 jongfoster + * Changes for new actions file, replacing permissionsfile + * and parts of the config file. Also added support for + * list_shared. + * + * Revision 1.9 2001/05/31 17:32:31 oes + * + * - Enhanced domain part globbing with infix and prefix asterisk + * matching and optional unanchored operation + * + * Revision 1.8 2001/05/29 20:09:15 joergs + * HTTP_REDIRECT_TEMPLATE fixed. + * + * Revision 1.7 2001/05/29 09:50:24 jongfoster + * Unified blocklist/imagelist/actionslist. + * File format is still under discussion, but the internal changes + * are (mostly) done. + * + * Also modified interceptor behaviour: + * - We now intercept all URLs beginning with one of the following + * prefixes (and *only* these prefixes): + * * http://i.j.b/ + * * http://ijbswa.sf.net/config/ + * * http://ijbswa.sourceforge.net/config/ + * - New interceptors "home page" - go to http://i.j.b/ to see it. + * - Internal changes so that intercepted and fast redirect pages + * are not replaced with an image. + * - Interceptors now have the option to send a binary page direct + * to the client. (i.e. ijb-send-banner uses this) + * - Implemented show-url-info interceptor. (Which is why I needed + * the above interceptors changes - a typical URL is + * "http://i.j.b/show-url-info?url=www.somesite.com/banner.gif". + * The previous mechanism would not have intercepted that, and + * if it had been intercepted then it then it would have replaced + * it with an image.) + * + * Revision 1.6 2001/05/27 22:17:04 oes + * + * - re_process_buffer no longer writes the modified buffer + * to the client, which was very ugly. It now returns the + * buffer, which it is then written by chat. + * + * - content_length now adjusts the Content-Length: header + * for modified documents rather than crunch()ing it. + * (Length info in csp->content_length, which is 0 for + * unmodified documents) + * + * - For this to work, sed() is called twice when filtering. + * + * Revision 1.5 2001/05/26 00:28:36 jongfoster + * Automatic reloading of config file. + * Removed obsolete SIGHUP support (Unix) and Reload menu option (Win32). + * Most of the global variables have been moved to a new + * struct configuration_spec, accessed through csp->config->globalname + * Most of the globals remaining are used by the Win32 GUI. + * + * Revision 1.4 2001/05/22 18:46:04 oes + * + * - Enabled filtering banners by size rather than URL + * by adding patterns that replace all standard banner + * sizes with the "Junkbuster" gif to the re_filterfile + * + * - Enabled filtering WebBugs by providing a pattern + * which kills all 1x1 images + * + * - Added support for PCRE_UNGREEDY behaviour to pcrs, + * which is selected by the (nonstandard and therefore + * capital) letter 'U' in the option string. + * It causes the quantifiers to be ungreedy by default. + * Appending a ? turns back to greedy (!). + * + * - Added a new interceptor ijb-send-banner, which + * sends back the "Junkbuster" gif. Without imagelist or + * MSIE detection support, or if tinygif = 1, or the + * URL isn't recognized as an imageurl, a lame HTML + * explanation is sent instead. + * + * - Added new feature, which permits blocking remote + * script redirects and firing back a local redirect + * to the browser. + * The feature is conditionally compiled, i.e. it + * can be disabled with --disable-fast-redirects, + * plus it must be activated by a "fast-redirects" + * line in the config file, has its own log level + * and of course wants to be displayed by show-proxy-args + * Note: Boy, all the #ifdefs in 1001 locations and + * all the fumbling with configure.in and acconfig.h + * were *way* more work than the feature itself :-( + * + * - Because a generic redirect template was needed for + * this, tinygif = 3 now uses the same. + * + * - Moved GIFs, and other static HTTP response templates + * to project.h + * + * - Some minor fixes + * + * - Removed some >400 CRs again (Jon, you really worked + * a lot! ;-) + * + * Revision 1.3 2001/05/20 01:21:20 jongfoster + * Version 2.9.4 checkin. + * - Merged popupfile and cookiefile, and added control over PCRS + * filtering, in new "actionsfile". + * - Implemented LOG_LEVEL_FATAL, so that if there is a configuration + * file error you now get a message box (in the Win32 GUI) rather + * than the program exiting with no explanation. + * - Made killpopup use the PCRS MIME-type checking and HTTP-header + * skipping. + * - Removed tabs from "config" + * - Moved duplicated url parsing code in "loaders.c" to a new funcition. + * - Bumped up version number. + * * Revision 1.2 2001/05/17 23:01:01 oes * - Cleaned CRLF's from the sources and related files * @@ -105,6 +225,9 @@ extern "C" { /* Need this for struct gateway */ struct client_state; +/* Need this for struct client_state */ +struct configuration_spec; + struct http_request { @@ -118,7 +241,6 @@ struct http_request int ssl; }; - struct gateway { /* generic attributes */ @@ -135,15 +257,38 @@ struct gateway }; -struct proxy_args +/* Generic linked list of strings */ +struct list /* FIXME: Why not separate entries and header? */ { - char *header; - char *invocation; - char *gateways; - char *trailer; + char * str; /* valid in an entry */ + struct list *last; /* valid in header */ + struct list *next; }; +/* A URL pattern */ +struct url_spec +{ + char *spec; + char *domain; /* fqdn */ + char *dbuf; + char **dvec; /* Domain ptr vector */ + int dcnt; /* How many domains in fqdn? */ + int unanchored; /* bitmap 0: left, 1: right */ + + char *path; + int pathlen; + int port; +#ifdef REGEX + regex_t *preg; +#endif +}; + +#define ANCHOR_LEFT 1 +#define ANCHOR_RIGHT 2 + + +/* An I/O buffer */ struct iob { char *buf; @@ -152,15 +297,81 @@ struct iob }; -struct list +#define IOB_PEEK(CSP) ((CSP->iob->cur > CSP->iob->eod) ? (CSP->iob->eod - CSP->iob->cur) : 0) +#define IOB_RESET(CSP) if(CSP->iob->buf) free(CSP->iob->buf); memset(CSP->iob, '\0', sizeof(CSP->iob)); + + + +#define ACTION_MASK_ALL (~0U) + +#define ACTION_MOST_COMPATIBLE 0U + +#define ACTION_BLOCK 0x0001U +#define ACTION_FAST_REDIRECTS 0x0002U +#define ACTION_FILTER 0x0004U +#define ACTION_HIDE_FORWARDED 0x0008U +#define ACTION_HIDE_FROM 0x0010U +#define ACTION_HIDE_REFERER 0x0020U /* sic - follow HTTP, not English */ +#define ACTION_HIDE_USER_AGENT 0x0040U +#define ACTION_IMAGE 0x0080U +#define ACTION_IMAGE_BLOCKER 0x0100U +#define ACTION_NO_COOKIE_READ 0x0200U +#define ACTION_NO_COOKIE_SET 0x0400U +#define ACTION_NO_POPUPS 0x0800U +#define ACTION_VANILLA_WAFER 0x1000U + +#define ACTION_STRING_FROM 0 +#define ACTION_STRING_IMAGE_BLOCKER 1 +#define ACTION_STRING_REFERER 2 +#define ACTION_STRING_USER_AGENT 3 +#define ACTION_STRING_COUNT 4 + +#define ACTION_MULTI_ADD_HEADER 0 +#define ACTION_MULTI_WAFER 1 +#define ACTION_MULTI_COUNT 2 + + +struct current_action_spec { - char *str; - struct list *last; - struct list *next; + unsigned flags; /* a bit set to "1" = add action */ + + /* For those actions that require parameters: */ + + /* each entry is valid if & only if corresponding entry in "add" set. */ + char * string[ACTION_STRING_COUNT]; + + /* Strings to add */ + struct list multi[ACTION_MULTI_COUNT][1]; }; -#define IOB_PEEK(CSP) ((CSP->iob->cur > CSP->iob->eod) ? (CSP->iob->eod - CSP->iob->cur) : 0) -#define IOB_RESET(CSP) if(CSP->iob->buf) free(CSP->iob->buf); memset(CSP->iob, '\0', sizeof(CSP->iob)); +struct action_spec +{ + unsigned mask; /* a bit set to "0" = remove action */ + unsigned add; /* a bit set to "1" = add action */ + + /* For those actions that require parameters: */ + + /* each entry is valid if & only if corresponding entry in "add" set. */ + char * string[ACTION_STRING_COUNT]; + + /* Strings to remove. */ + struct list multi_remove[ACTION_MULTI_COUNT][1]; + + /* If nonzero, remove *all* strings. */ + int multi_remove_all[ACTION_MULTI_COUNT]; + + /* Strings to add */ + struct list multi_add[ACTION_MULTI_COUNT][1]; +}; + +struct url_actions +{ + struct url_spec url[1]; + + struct action_spec action[1]; + + struct url_actions * next; +}; /* Constants defining bitmask for csp->accept_types */ @@ -188,11 +399,21 @@ struct list struct client_state { - int permissions; - + /* The proxy's configuration */ + struct configuration_spec * config; + + + /* The actions to perform on the current request */ + struct current_action_spec action[1]; + + + /* socket to talk to client (web browser) */ int cfd; + + /* socket to talk to server (web server or proxy) */ int sfd; + #ifdef STATISTICS /* 1 if this URL was rejected, 0 otherwise. Allows actual stats inc to * occur in main thread only for thread-safety. @@ -205,17 +426,20 @@ struct client_state #endif /* def FORCE_LOAD */ #ifdef TOGGLE - /* - * by haroon - most of credit to srt19170 - * We add an "on/off" toggle here that is used to effectively toggle - * the Junkbuster off or on - */ int toggled_on; -#endif +#endif /* def TOGGLE */ + /* + * Client PC's IP address, as reported by the accept()_ function. + * Both as string and number + */ char *ip_addr_str; long ip_addr_long; + +#ifdef TRUST_FILES + /* The referer in this request, if one was specified. */ char *referrer; +#endif /* def TRUST_FILES */ #if defined(DETECT_MSIE_IMAGES) /* Types the client will accept. @@ -224,43 +448,50 @@ struct client_state int accept_types; #endif /* defined(DETECT_MSIE_IMAGES) */ - const struct gateway *gw; + /* The URL that was requested */ struct http_request http[1]; + /* An I/O buffer used for buffering data read from the client */ struct iob iob[1]; + /* List of all headers for this request */ struct list headers[1]; + + /* List of all cookies for this request */ struct list cookie_list[1]; + #if defined(PCRS) || defined(KILLPOPUPS) + /* Nonzero if this has a text MIME type */ int is_text; #endif /* defined(PCRS) || defined(KILLPOPUPS) */ + /* The "X-Forwarded-For:" header sent by the client */ char *x_forwarded; + /* + * Nonzero if this client is processing data. + * Set to zero when the thread associated with this structure dies. + */ int active; /* files associated with this client */ - struct file_list *blist; /* blockfile */ struct file_list *flist; /* forwardfile */ - struct file_list *permissions_list; - + struct file_list *actions_list; + -#ifdef ACL_FILES +#ifdef ACL_FILES struct file_list *alist; /* aclfile */ #endif /* def ACL_FILES */ -#ifdef USE_IMAGE_LIST - struct file_list *ilist; /* imagefile */ -#endif /* def USE_IMAGE_LIST */ - #ifdef PCRS struct file_list *rlist; /* Perl re_filterfile */ + size_t content_length; /* Length after processing */ #endif /* def PCRS */ #ifdef TRUST_FILES struct file_list *tlist; /* trustfile */ #endif /* def TRUST_FILES */ - + struct client_state *next; }; @@ -281,26 +512,6 @@ struct interceptors }; -/* this allows the proxy to permit/block access to any host and/or path */ - -struct url_spec -{ - char *spec; - char *domain; - char *dbuf; - char **dvec; - int dcnt; - int toplevel; - - char *path; - int pathlen; - int port; -#ifdef REGEX - regex_t *preg; -#endif -}; - - struct file_list { /* @@ -343,30 +554,19 @@ struct file_list }; +#ifdef TRUST_FILES struct block_spec { struct url_spec url[1]; int reject; struct block_spec *next; }; - - -#define PERMIT_COOKIE_SET 0x0001 -#define PERMIT_COOKIE_READ 0x0002 -#define PERMIT_RE_FILTER 0x0004 -#define PERMIT_POPUPS 0x0008 - -struct permissions_spec -{ - struct url_spec url[1]; - int permissions; - struct permissions_spec * next; -}; - +#endif /* def TRUST_FILES */ + + struct forward_spec { struct url_spec url[1]; - int reject; struct gateway gw[1]; struct forward_spec *next; }; @@ -380,7 +580,7 @@ struct re_filterfile_spec pcrs_job *joblist; }; #endif /* def PCRS */ - + #ifdef ACL_FILES #define ACL_PERMIT 1 /* accept connection request */ @@ -403,6 +603,78 @@ struct access_control_list }; #endif /* def ACL_FILES */ + +/* Maximum number of loaders (actions, block, forward, acl...) */ +#define NLOADERS 8 + +/* + * Data loaded from the configuration file. + * + * (Anomaly: toggle is still handled through a global, not this structure) + */ +struct configuration_spec +{ + int debug; + int multi_threaded; + + const char *logfile; + + const char *actions_file; + const char *forwardfile; + +#ifdef ACL_FILES + const char *aclfile; +#endif /* def ACL_FILES */ + +#ifdef PCRS + const char *re_filterfile; +#endif /* def PCRS */ + +#ifdef JAR_FILES + const char * jarfile; + FILE * jar; +#endif /* def JAR_FILES */ + + /* + * Port and IP to bind to. + * Defaults to HADDR_DEFAULT:HADDR_PORT == 127.0.0.1:8000 + */ + const char *haddr; + int hport; + +#ifndef SPLIT_PROXY_ARGS + const char *suppress_message; +#endif /* ndef SPLIT_PROXY_ARGS */ + +#ifndef SPLIT_PROXY_ARGS + /* suppress listing config files */ + int suppress_blocklists; +#endif /* ndef SPLIT_PROXY_ARGS */ + +#ifdef TRUST_FILES + const char * trustfile; + + struct list trust_info[1]; + struct url_spec *trust_list[64]; +#endif /* def TRUST_FILES */ + + /* Various strings for show-proxy-args */ + char *proxy_args_header; + char *proxy_args_invocation; + char *proxy_args_gateways; + char *proxy_args_trailer; + + /* the configuration file object. */ + struct file_list *config_file_list; + + /* List of loaders */ + int (*loaders[NLOADERS])(struct client_state *); + + /* bool, nonzero if we need to bind() to the new port */ + int need_bind; +}; + + #define SZ(X) (sizeof(X) / sizeof(*X)) #define WHITEBG "\n" @@ -410,20 +682,113 @@ struct access_control_list #define BANNER "Internet JUNKBUSTER" #ifdef FORCE_LOAD -/* - * FIXME: Unfortunately, IE lowercases the domain name. JunkBuster does - * a case-sensitive compare. JunkBuster should be modified to do a - * case-insensitive compatison. As a temporary workaround, I've lowercased - * the FORCE_PREFIX. - * - * #define FORCE_PREFIX "IJB-FORCE-LOAD-" - */ -#define FORCE_PREFIX "ijb-force-load-" +#define FORCE_PREFIX "/IJB-FORCE-LOAD" #endif /* def FORCE_LOAD */ #define HOME_PAGE_URL "http://ijbswa.sourceforge.net/" #define REDIRECT_URL HOME_PAGE_URL "redirect.php?v=" VERSION "&to=" +static const char CFAIL[] = + "HTTP/1.0 503 Connect failed\n" + "Content-Type: text/html\n\n" + "\n" + "\n" + "Internet Junkbuster: Connect failed\n" + "\n" + BODY + "

" + BANNER + "

" + "TCP connection to '%s' failed: %s.\n
" + "\n" + "\n"; + +static const char CNXDOM[] = + "HTTP/1.0 404 Non-existent domain\n" + "Content-Type: text/html\n\n" + "\n" + "\n" + "Internet Junkbuster: Non-existent domain\n" + "\n" + BODY + "

" + BANNER + "

" + "No such domain: %s\n" + "\n" + "\n"; + +static const char CNOBANNER[] = + "HTTP/1.0 200 No Banner\n" + "Content-Type: text/html\n\n" + "\n" + "\n" + "Internet Junkbuster: No Banner\n" + "\n" + BODY + "

" + BANNER + "

" + "You asked for a banner that this proxy can't produce because either configuration does not permit.\n
" + "or the URL didn't end with .gif\n" + "\n" + "\n"; + +static const char CSUCCEED[] = + "HTTP/1.0 200 Connection established\n" + "Proxy-Agent: IJ/" VERSION "\n\n"; + +static const char CHEADER[] = + "HTTP/1.0 400 Invalid header received from browser\n\n"; + +static const char SHEADER[] = + "HTTP/1.0 502 Invalid header received from server\n\n"; + +#ifdef IMAGE_BLOCKING + +/* + * Hint: You can encode your own GIFs like that: + * perl -e 'while (read STDIN, $c, 1) { printf("\\%.3o,", unpack("C", $c)); }' + */ + +static const char BLANKGIF[] = + "HTTP/1.0 200 OK\r\n" + "Pragma: no-cache\r\n" + "Last-Modified: Thu Jul 31, 1997 07:42:22 pm GMT\r\n" + "Expires: Thu Jul 31, 1997 07:42:22 pm GMT\r\n" + "Content-type: image/gif\r\n\r\n" + "GIF89a\001\000\001\000\200\000\000\377\377\377\000\000" + "\000!\371\004\001\000\000\000\000,\000\000\000\000\001" + "\000\001\000\000\002\002D\001\000;"; + +static const char JBGIF[] = + "HTTP/1.0 200 OK\r\n" + "Pragma: no-cache\r\n" + "Last-Modified: Thu Jul 31, 1997 07:42:22 pm GMT\r\n" + "Expires: Thu Jul 31, 1997 07:42:22 pm GMT\r\n" + "Content-type: image/gif\r\n\r\n" + "GIF89aD\000\013\000\360\000\000\000\000\000\377\377\377!" + "\371\004\001\000\000\001\000,\000\000\000\000D\000\013\000" + "\000\002a\214\217\251\313\355\277\000\200G&K\025\316hC\037" + "\200\234\230Y\2309\235S\230\266\206\372J\253<\3131\253\271" + "\270\215\342\254\013\203\371\202\264\334P\207\332\020o\266" + "N\215I\332=\211\312\3513\266:\026AK)\364\370\365aobr\305" + "\372\003S\275\274k2\354\254z\347?\335\274x\306^9\374\276" + "\037Q\000\000;"; + +#endif /* def IMAGE_BLOCKING */ + +#if defined(FAST_REDIRECTS) || defined(IMAGE_BLOCKING) + +static const char HTTP_REDIRECT_TEMPLATE[] = + "HTTP/1.0 302 Local Redirect from Junkbuster\r\n" + "Pragma: no-cache\r\n" + "Last-Modified: Thu Jul 31, 1997 07:42:22 pm GMT\r\n" + "Expires: Thu Jul 31, 1997 07:42:22 pm GMT\r\n" + "Location: %s\r\n\r\n"; + +#endif /* defined(FAST_REDIRECTS) || defined(IMAGE_BLOCKING) */ + #ifdef __cplusplus } /* extern "C" */ #endif