X-Git-Url: http://www.privoxy.org/gitweb/?p=privoxy.git;a=blobdiff_plain;f=default.filter;h=d9fcb3826325d357c3757dbdeb9aabaeaba8b2a2;hp=728a7186fc9e98c6768373537fff0510cb276408;hb=1fafdd0184d40f4f90b0f38866f8606568589db5;hpb=472006f94cd350ff6e734c156cbbb93dab86d864 diff --git a/default.filter b/default.filter index 728a7186..d9fcb382 100644 --- a/default.filter +++ b/default.filter @@ -2,17 +2,13 @@ # # File : $Source: /cvsroot/ijbswa/current/default.filter,v $ # -# $Id: basic.action,v 1.3 2002/03/26 22:29:54 swa Exp $ +# $Id: default.filter,v 1.12 2002/09/05 14:55:38 oes Exp $ # # Purpose : Rules to process the content of web pages # # Copyright : Written by and Copyright # Privoxy team. http://www.privoxy.org/ # -# Based on the Internet Junkbuster originally written -# by and Copyright (C) 1997 Anonymous Coders and -# Junkbusters Corporation. http://www.junkbusters.com -# # We value your feedback. However, to provide you with the best support, # please note: # @@ -21,7 +17,7 @@ # * Submit bugs only thru our bug forum: # http://sourceforge.net/tracker/?group_id=11118&atid=111118 # Make sure that the bug has not already been submitted. Please try -# to verify that it is a Junkbuster bug, and not a browser or site +# to verify that it is a Privoxy bug, and not a browser or site # bug first. If you are using your own custom configuration, please # try the stock configs to see if the problem is a configuration # related bug. And if not using the latest development snapshot, @@ -66,48 +62,70 @@ ################################################################################# # -# html-annoyances: Get rid of particularly annoying HTML abuse +# js-annoyances: Get rid of particularly annoying JavaScript abuse # ################################################################################# -FILTER: html-annoyances Get rid of particularly annoying HTML abuse +FILTER: js-annoyances Get rid of particularly annoying JavaScript abuse -# New browser windows (if allowed -- see no-popups filter below) should be -# resizeable and have a location and status bar +# Note: Most of these jobs would be safer if restricted to a +# )|$1never|sigU + +# If we allow window.open, we want normal window features: +# Test: http://www.htmlgoodies.com/beyond/notitle.html +# +s/(open\s*\([^\)]+resizable=)(["']?)(?:no|0)\2/$1$2yes$2/sigU +s/(open\s*\([^\)]+location=)(["']?)(?:no|0)\2/$1$2yes$2/sigU +s/(open\s*\([^\)]+status=)(["']?)(?:no|0)\2/$1$2yes$2/sigU +s/(open\s*\([^\)]+scroll(?:ing|bars)=)(["']?)(?:no|0)\2/$1$2auto$2/sigU +s/(open\s*\([^\)]+menubar=)(["']?)(?:no|0)\2/$1$2yes$2/sigU +s/(open\s*\([^\)]+toolbar=)(["']?)(?:no|0)\2/$1$2yes$2/sigU +s/(open\s*\([^\)]+directories=)(["']?)(?:no|0)\2/$1$2yes$2/sigU +s/(open\s*\([^\)]+fullscreen=)(["']?)(?:yes|1)\2/$1$2no$2/sigU +s/(open\s*\([^\)]+always(?:raised|lowered)=)(["']?)(?:yes|1)\2/$1$2no$2/sigU +s/(open\s*\([^\)]+zlock=)(["']?)(?:yes|1)\2/$1$2no$2/sigU +s/(open\s*\([^\)]+hotkeys=)(["']?)(?:yes|1)\2/$1$2no$2/sigU +s/(open\s*\([^\)]+titlebar=)(["']?)(?:yes|1)\2/$1$2yes$2/sigU ################################################################################# # -# js-annoyances: Get rid of particularly annoying JavaScript abuse +# html-annoyances: Get rid of particularly annoying HTML abuse # ################################################################################# -FILTER: js-annoyances Get rid of particularly annoying JavaScript abuse - -# Get rid of Javascript referrer tracking. Test page: http://www.randomoddness.com/untitled.htm -# -s|()|$1"Not Your Business!"$2|Usg +FILTER: html-annoyances Get rid of particularly annoying HTML abuse -# The status bar is for displaying link targets, not pointless blahblah +# New browser windows (if allowed -- see no-popups filter below) should be +# resizeable and have a location and status bar # -s/status='.*?';*//ig +s/(]+resizable=)(['"]?)(?:no|0)\2/$1$2yes$2/igU +s/(]+location=)(['"]?)(?:no|0)\2/$1$2yes$2/igU +s/(]+status=)(['"]?)(?:no|0)\2/$1$2yes1$2/igU +s/(]+scrolling=)(['"]?)(?:no|0)\2/$1$2auto$2/igU +s/(]+menubar=)(['"]?)(?:no|0)\2/$1$2yes$2/igU -# Kill OnUnload popups. Yummy. Test: http://www.zdnet.com/zdsubs/yahoo/tree/yfs.html +# The tag was a crime! # -s/()/$1never$2/iU +s*|**ig ################################################################################# @@ -119,57 +137,143 @@ FILTER: content-cookies Kill cookies that come in the HTML or JS content # JS cookies, like found on privacy.net: # -s|(document\.cookie)([ \t\r\n]*=)|documenZapCooky$2|g +s|document\.cookie(?=[ \t\r\n]*=)|ZappedCookie|ig # HTML cookies: # -s|].*>||iUT +s|||igU + + +################################################################################# +# +# webbugs: Squish WebBugs (1x1 invisible GIFs used for user tracking) +# +################################################################################# +FILTER: webbugs Squish WebBugs (1x1 invisible GIFs used for user tracking) + +s/]*(?:width|height)\s*=\s*['"]?1(?=\D)[^>]*(?:width|height)\s*=\s*['"]?1(?=\D)[^>]*?>//siUg ################################################################################## # -# no-popups: Kill all popups in JS and HTML +# popups: Kill all popups in JS and HTML # ################################################################################# -FILTER: no-popups Kill all popups in JS and HTML +FILTER: popups Kill all popups in JS and HTML + +s/([\n =;{}]|window\.)open\s*\\?\(/$1concat(/ig # JavaScript +s/ target\s*=\s*(['"]?)(_blank|_new)\1?/ notarget/ig # HTML -s/window\.open\(/1;''\.concat\(/ig # JavaScript -s/target=['"]?_blank['"]?/target_crunched/ig # HTML -s/target=['"]?_new['"]?/target_crunched/ig # HTML ################################################################################# # -# frameset-borders: Give frames a border and make them resizable +# frameset-borders: Give frames a border, make them resizable and scrollable # ################################################################################# FILTER: frameset-borders Give frames a border and make them resizable -s/(]+)framespacing=['"]?(no|0)['"]?(.*>)/$1$3/igU -s/(]+)frameborder=['"]?(no|0)['"]?(.*>)/$1$3/igU -s/(]+)border=['"]?(no|0)['"]?(.*>)/$1$3/igU -s/(]+)resizable=['"]?(no|0|false)['"]?(.*>)/$1$3/igU +s/(]*)framespacing=(['"]?)(no|0)\2/$1/igU +s/(]*)frameborder=(['"]?)(no|0)\2/$1/igU +s/(]*)border=(['"]?)(no|0)\2/$1/igU +s/(]*)noresize/$1/igU +s/(]*)frameborder=(['"]?)(no|0)\2/$1/igU +s/(]*)scrolling=(['"]?)(no|0)\2/$1/igU + ################################################################################# # -# webbugs: Squish WebBugs (1x1 invisible GIFs used for user tracking) +# refresh-tags: Kill automatic refresh tags (for dial-on-demand setups) # ################################################################################# -FILTER: webbugs Squish WebBugs (1x1 invisible GIFs used for user tracking) +FILTER: refresh-tags Kill automatic refresh tags (for dial-on-demand setups) -s/]*?(width|height)\s*=\s*['"]?1\D[^>]*?(width|height)\s*=\s*['"]?1(\D[^>]*?)?>//sig +# Note: Only deactivates refreshes with more than 9 seconds delay to +# preserve monster-stupid but common redirections via meta tags. +# +s/\2]*))?\2\s*>//iU ################################################################################# # -# no-refresh: Kill automatic refresh tags (for dial-on-demand setups) +# img-reorder: Reorder attributes in tags to make the banners-by-* filters more effective # ################################################################################# -FILTER: no-refresh Kill automatic refresh tags (for dial-on-demand setups) +FILTER: img-reorder Reorder attributes in tags to make the banners-by-* filters more effective -s/]*)['"]?>//iU -s/].*>//iU +# In the first step src is moved to the start, then width is moved to the second +# place to guarantee an order of src, width, height. +# This makes banners-by-size more effective and allows both banners-by-size +# and banners-by-link to preserve the original image URL in the alt attribute. + +s|]*)src\s*=\s*(['"])([^>\\\2]+)\2|]*)src\s*=\s*([^'">\\\s]+)|\\\\2]+\2\|[^'">\\\s]+?))([^>]*)width\s*=\s*(["']?)(\d+?)|\\\1\s]+)\1)?[^>]*?(width=(['"]?)88\4)[^>]*?(height=(['"]?)31\6)[^>]*>@$1Killed-$2-by-size$1@sig +# 120*60, 120*90, 120*240, 120*600 +s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)120\4)[^>]*?(height=(['"]?)(?:600?|90|240)\6)[^>]*>@$1Killed-$2-by-size$1@sig +# 125*125 +s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)125\4)[^>]*?(height=(['"]?)125\6)[^>]*>@$1Killed-$2-by-size$1@sig +# 160*600 +s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)160\4)[^>]*?(height=(['"]?)600\6)[^>]*>@$1Killed-$2-by-size$1@sig +# 180*150 +s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)180\4)[^>]*?(height=(['"]?)150\6)[^>]*>@$1Killed-$2-by-size$1@sig +# 234*60, 468*60 (Most Banners!) +s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)(?:234|468)\4)[^>]*?(height=(['"]?)60\6)[^>]*>@$1Killed-$2-by-size$1@sig +# 240*400 +s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)240\4)[^>]*?(height=(['"]?)400\6)[^>]*>@$1Killed-$2-by-size$1@sig +# 250*250, 300*250 +s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)(?:250|300)\4)[^>]*?(height=(['"]?)250\6)[^>]*>@$1Killed-$2-by-size$1@sig +# 336*280 +s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)336\4)[^>]*?(height=(['"]?)280\6)[^>]*>@$1Killed-$2-by-size$1@sig + +# Note: 200*50 was also proposed, but it probably causes too much collateral damage: +# +#s@\\\1\s]+)\1)?[^>]*?(width=(['"]?)200\4)[^>]*?(height=(['"]?)50\6)[^>]*>@$1Killed-$2-by-size$1@sig + + +################################################################################# +# +# banners-by-link: Kill banners by their links to known clicktrackers +# +################################################################################# +FILTER: banners-by-link Kill banners by their links to known clicktrackers + +# Common case with width and height attributes: +# +s@\1\s]*?(?:\ + adclick # See www.dn.se \ +| atwola\.com/(?:link|redir) # see www.cnn.com \ +| /jump/ # redirs for doublecklick.net ads \ +| tracker | counter # common \ +| adlog\.pl # see sf.net \ +)[^>\1\s]*)\1[^>]*>\s*\\\3\s]+)\3)?[^>]*((?:width|height)\s*=\s*(['"]?)\d+?\6)[^>]*((?:width|height)\s*=\s*(['"]?)\d+?\8)[^>]*>\ +@$1Killed@sigx + +# Rare case w/o explicit dimensions: +# +s@\1\s]*?(?:adclick|atwola\.com/(?:link|redir)|doubleclick\.net/jump/|tracker|counter|adlog\.pl)[^>\1\s]*)\1[^>]*>\s*\\\3\s]+)\3)?[^>]*>@$1Killed@sig + ################################################################################# # # fun: Text replacements for subversive browsing fun! @@ -179,17 +283,19 @@ FILTER: fun Text replacements for subversive browsing fun! s/microsoft(?!.com)/MicroSuck/ig -# Buzzword Bingo (example for extended syntax) +# Buzzword Bingo (example for extended regex syntax) # s* industry[ -]leading \ | cutting[ -]edge \ +| customer[ -]focused \ +| market[ -]driven \ | award[ -]winning # Comments are OK, too! \ | high[ -]performance \ | solutions[ -]based \ | unmatched \ | unparalleled \ | unrivalled \ -*BINGO! \ +*BINGO! \ *igx @@ -200,42 +306,39 @@ s* industry[ -]leading \ ################################################################################# FILTER: nimda Remove Nimda (virus) code -s%%

Internet JUNKBUSTER WARNING: This Server is infected with Nimda!%g +s%%
WARNING: This Server is infected with Nimda!%g ################################################################################# # -# banners-by-size: Kill banners by size +# shockwave-flash: Kill embedded Shockwave Flash objects # +################################################################################# +FILTER: shockwave-flash Kill embedded Shockwave Flash objects + +s|]*application/x-shockwave-flash.*||sigU + + ################################################################################# # -# Standard banner sizes taken from http://www.iab.net/iab_banner_standards/bannersizes.html -# -# Note: Use http://config.privoxy.org/send-banner?type=trans for a transparent 1x1 image -# Use http://config.privoxy.org/send-banner?type=pattern for a grey/white pattern image -# Use http://config.privoxy.org/send-banner?type=auto to auto-select. +# quicktime-kioskmode: Make Quicktime movies saveable # ################################################################################# -FILTER: banners-by-size Kill banners by size +FILTER: quicktime-kioskmode Make Quicktime movies saveable + +s/(]*)kioskmode\s*=\s*(["']?)true\2/$1/ig -s|]*?(width=['"]?468\D)[^>]*(height=['"]?60[^>]*?)>||sig -s|]*?(width=['"]?234\D)[^>]*(height=['"]?60[^>]*?)>||sig -s|]*?(width=['"]?88\D)[^>]*(height=['"]?31[^>]*?)>||sig -s|]*?(width=['"]?120\D)[^>]*(height=['"]?90[^>]*?)>||sig -s|]*?(width=['"]?120\D)[^>]*(height=['"]?600[^>]*?)>||sig -s|]*?(width=['"]?120\D)[^>]*(height=['"]?60[^>]*?)>||sig -s|]*?(width=['"]?160\D)[^>]*(height=['"]?600[^>]*?)>||sig -s|]*?(width=['"]?125\D)[^>]*(height=['"]?125[^>]*?)>||sig -s|]*?(width=['"]?120\D)[^>]*(height=['"]?240[^>]*?)>||sig -s|]*?(width=['"]?180\D)[^>]*(height=['"]?150[^>]*?)>||sig -s|]*?(width=['"]?300\D)[^>]*(height=['"]?250[^>]*?)>||sig -s|]*?(width=['"]?250\D)[^>]*(height=['"]?250[^>]*?)>||sig -s|]*?(width=['"]?240\D)[^>]*(height=['"]?400[^>]*?)>||sig -s|]*?(width=['"]?336\D)[^>]*(height=['"]?280[^>]*?)>||sig -# One more. (Where is 200x50 from?) +################################################################################# +# +# js-events: Kill all JS event bindings (Radically destructive! Only for extra nasty sites) # -s|]*?(width=['"]?200\D)[^>]*(height=['"]?50[^>]*?)>||sig +################################################################################# +FILTER: js-events Kill all JS event bindings (Radically destructive! Only for extra nasty sites) + +s/(on|event\.)((mouse(over|out|down|up|move))|(un)?load|contextmenu|selectstart)/never/ig +# Not events, but abused on the same type of sites: +s/(alert|confirm)\s*\(/concat(/ig ################################################################################# @@ -244,20 +347,63 @@ s|]*?(width=['"]?200\D)[^>]*(height=['"]?50[^>]*?)>|Blocked

Blocked due to possible adult content. Please see this site.

%is s+^.*warez.*$+No Warez

You're not searching for illegal stuff, are you?

+is + ############################################################################## # # Revisions : # $Log: default.filter,v $ +# Revision 1.12 2002/09/05 14:55:38 oes +# Synced with the stable branch: +# Revision 1.11.2.6 2002/08/23 14:12:26 oes +# Proofed frameset-borders against "fremaborder=0 border=0" +# +# Revision 1.11.2.5 2002/08/22 15:05:20 oes +# Added Filter to make Quicktime movies saveable (thanks to aaron@linville.org for the idea) +# +# Revision 1.11.2.4 2002/08/10 11:32:29 oes +# Attribute values in replacement tags of banners-by-size filter now undelimited. (Fixes bug #592493) +# +# Revision 1.11.2.3 2002/08/05 11:43:56 oes +# Fixed a bug in the popups filter that was introduced with the last fix :-( +# +# Revision 1.11.2.2 2002/08/01 11:20:13 oes +# Fixed bugs 587802, 577802 and an unreported one +# +# Revision 1.11.2.1 2002/07/26 15:18:26 oes +# - All filters reviewed and many shorcomings fixed +# - New filters: img-reorder, banners-by-link and js-events +# - Jobs reorderd because they are now executed in order of +# appearance +# +# Revision 1.11 2002/05/24 00:57:18 oes +# Made WeBugs job ungreedy; Fixes bug 559190 +# +# Revision 1.10 2002/04/18 10:14:19 oes +# renamed some filters +# +# Revision 1.9 2002/04/11 07:36:35 oes +# Generalized js-popup filter +# +# Revision 1.8 2002/04/10 17:07:21 oes +# Fixed potentially desctructive jobs, added noflash filter +# +# Revision 1.7 2002/04/09 18:34:51 oes +# Fixed HTML syntax in replacements +# +# Revision 1.6 2002/04/03 19:49:52 swa +# name change +# +# Revision 1.5 2002/03/27 15:30:26 swa +# have a consistent appearance +# # Revision 1.4 2002/03/26 22:29:54 swa # we have a new homepage! #