Old Proxomitron Forums
Proxomitron Filters - Discussions welcome => Block List Files => Topic started by: Arne on October 25, 2001, 09:51:09 PM
-
Henk has posted a few of his filters, and I have placed them here as a collection:
FILTERS:
Name = "Lockergnome Cleaner"
#What - removes lockergnome "sidebar" text ads
#Example page - http://www.lockergnome.com/issues/daily.html
#Date - 10-22-01
#Note - Match covers a <p class="sidebar"> paragraph that wraps a single
#       <table>...</table>. No Replace is given, so presumably the whole
#       match is replaced with nothing - confirm.
Active = TRUE
URL = "www.lockergnome.com"
Bounds = "<p class="sidebar"><table*><tr><td>*</p>"
Limit = 3000
Match = "<p class="sidebar">$NEST(<table*>,</table>)</p>"
Name = "FreewarePublishing Cleaner"
#What - removes huge junk section from FPS
#Example page - http://www.katho.be/freeware/freeware.htm
#Date - 10-22-01
#Note - Match runs from one marker comment (<!-...XX.X...->) to the next
#       one of the same shape; Limit is set to 32000 because the span
#       between the two markers is large.
Active = TRUE
URL = "www.katho.be/freeware"
Limit = 32000
Match = "<!-+??????XX?X+?-+>*<!-+??????XX?X+?-+>"
Replace = "$STOP()"
Name = "FreewarePublishing Linkbuster"
#What - removes most spam&junk links from FPS
#Example page - http://www.katho.be/freeware/freeware.htm
#Date - 10-22-01
#Note - works on one <!--soft ... <!--endsoft ...> entry at a time and only
#       matches entries whose text after <!--info--> hits the Urls_usr list.
#       Urls_usr is not defined here; presumably a user blocklist - confirm.
Active = TRUE
URL = "www.katho.be/freeware/"
Bounds = "<!--soft*<!--endsoft*>"
Limit = 4000
Match = "<!--soft*<!--info-->*($LST(Urls_usr))*<!--endsoft[^>]++>"
Name = "ZDNet Cleaner"
#What - removes page bottom junk part from ZDNet
#Example page - http://www.zdnet.com/pcmag/
#Date - 10-22-01
#Note - Replace closes the document and then issues \k (presumably
#       Proxomitron's "kill the rest of the transfer" escape - confirm).
#       Without the backslash a literal "k" is written after </html>.
Active = TRUE
URL = "www.zdnet.com"
Limit = 256
Match = "<P ALIGN='center'>|<!--START SPONSORED LINKS-->"
Replace = "</body></html>\k$STOP()"
Name = "LII Tracking Links Cleaner"
#What - converts the funny tracking links at Lii to normal urls
#Example page - http://lii.org/search?title=New+This+Week&query=New+this+week&subsearch=New+this+week&searchtype=subject
#Date - 10-22-01
#Note - \2 captures the link text and \1 the plain URL that is printed
#       after the link; Replace rebuilds a direct anchor from the two.
Active = TRUE
URL = "lii.org"
Bounds = "<a href=*</font>"
Limit = 256
Match = "<A HREF="/search?goto=[#1-*]">*\2</A>*http://\1</FONT>"
Replace = "<a href="http://\1">\2</a>"
Name = "Yahoo Form Filler"
#What - Needed because of using session-only cookies
#Example page - http://login.yahoo.com/config/login?.intl=us&.src=ygrp&.done=http://groups.yahoo.com%2Fgroup%2Fprox-list%2F
#Date - 10-22-01
#Note - "myusername" and "mypassword" are presumably placeholders to be
#       replaced with your own credentials; they are stored in plain text
#       in this filter. \1 carries over the markup between the two inputs.
Active = TRUE
URL = "login.yahoo.com"
Limit = 1000
Match = "<input name="login" size="17" maxlength="32" value="">(*)\1<input name="passwd""
Replace = "<input name="login" size="17" maxlength="32" value="myusername">\1<input name="passwd" value="mypassword""
          "$STOP()"
Name = "Tucows Freeware Links Only"
#What - remove non-freeware from Tucows (leaving GPL, freeware in place)
#Example page - http://tucows.nl.uu.net/whatsnew.html
#Date - 10-22-01
#Note - each program entry starts with a "<!-- Current program set to N -->"
#       comment; entries mentioning shareware, adware, demo or commerc* are
#       cut back to the opening "<!--" of the next comment.
Active = TRUE
Multi = TRUE
URL = "tucows.nl.uu.net"
Bounds = "<!-- Current program set to*<!--"
Limit = 2000
Match = "<!-- Current program set to [#0-*] -->*((share|ad)ware|demo|commerc*)<*<!--"
Replace = "<!--"
Name = "Koodles Cleaner part 1"
#What - remove Koodles top and sidebar junk
#Example page - http://www.fileclicks.com/?show=2
#Date - 10-22-01
#Note - everything from the 760-wide table down to the FileDirectory tab
#       image is swapped for a minimal table skeleton that ends at that
#       same image, so the rest of the page continues inside it.
Active = TRUE
URL = "www.fileclicks.com"
Bounds = "<table width="760"*<img src="kooimgs/tabs/FileDirectory.gif""
Limit = 14000
Match = "<table width="760"*<img src="kooimgs/tabs/FileDirectory.gif""
Replace = "<table width="100%" border="0" cellspacing="0" cellpadding="0">"
          "<tr>"
          "<td valign="top" width="466">"
          "<table width="450" border="0" cellspacing="0" cellpadding="0" align="center">"
          "<tr>"
          "<td valign="top" align="left" colspan="3">"
          "<img src="kooimgs/tabs/FileDirectory.gif"$STOP()"
Name = "Koodles Cleaner part 2"
#What - remove Koodles page bottom junk
#Example page -
#Date - 10-22-01
#Note - Replace closes the open cell/row/table/div after "..Old Blurbs",
#       ends the document and then issues \k (presumably Proxomitron's
#       "kill the rest of the transfer" escape - confirm). Without the
#       backslash a literal "k" is written after </html>.
Active = TRUE
URL = "www.fileclicks.com"
Bounds = "<b>..Old Blurbs*</div>"
Limit = 256
Match = "<b>..Old Blurbs</b></a></td>*</tr>*</table>*</div>"
Replace = "<b>..Old Blurbs</b></a></td></tr></table></div>"
          "</body></html>\k$STOP()"
Name = "UnBold Bold Text"
#What - removing all that overused bold makes pages much more serene (use css too)
#Example page - wherever
#Date - 10-22-01
#Note - matches opening and closing <b>, <b ...>, <blink> and <strong>
#       tags and swaps each for an inert comment. \s is needed so that
#       "<b " with attributes matches; a bare "s" would only match "<bs...".
Active = TRUE
Multi = TRUE
Bounds = "<(/|)(b|s)*>"
Limit = 20
Match = "<(/|)(b(\s*|link|)|strong)>"
Replace = "<!--b-->"
Name = "Show Link Instead of Auto-Redirection"
#What - instead of killing redirection, which leaves no choice, make it a link
#Example page - all pages that use simple redirection
#Date - 10-22-01
#Note - handles two redirect forms: <meta http-equiv="refresh" ... URL=...>
#       and <script>...document.location.replace(...)</script>. The target
#       is captured in \1 and shown as a clickable link.
#NOTE(review) - "**FIX**" is a placeholder left by the forum software; the
#       original token is unknown (presumably a single quote). Replace it
#       before using this filter.
Active = TRUE
Bounds = "<(meta*|script*</script)>"
Limit = 512
Match = "<(meta http-equiv="refresh" content="[#0-15]; URL=(\w)\1 * |"
        "script>*document.location.replace\(("|**FIX**|) \1 ("|**FIX**|)\)*</script)>"
Replace = "<font size=2><tt>This page would have redirected you to <a href="\1">\1</A></tt></font><hr size=1>"
          "$STOP()"
Name = "Hide ImageMaps by Text"
#What - hide imagemaps that somewhere contain "unwanted" blocklist strings
#Example page - depends on what's in your Keywords blocklist
#Date - 10-22-01
#Note - only <img>/<image> tags carrying a usemap attribute are examined;
#       a tag that hits the Keyw_def list is swapped for a small bar image.
#       dbluebar.gif is not defined here - presumably a local image.
Active = TRUE
Bounds = "<im(g|age)\s*usemap*>"
Limit = 1024
Match = "<im(g|age)\s*$LST(Keyw_def)*>"
Replace = "<img src=dbluebar.gif width=25 height=7 alt="" border=0>"
Name = "Kill Unwanted Forms (debug version)"
#What - debug for the normal version of this filter, indicates what string caused a match
#Example page - depends on what's in your Forms blocklist
#Date - 10-22-01
#Note - the blocklist hit is captured in \1 and printed after the bar image
#       as "HIT=...". The leading ^ in URL presumably excludes the listed
#       hosts from filtering - confirm.
Active = FALSE
URL = "^(grc.com|(web|www).altavista.com|(login|groups).yahoo.com)"
Bounds = "<form\s*</form>"
Limit = 8000
Match = "<form*($LST(Forms_Def))\1*</form>"
Replace = "<a href="http://bweb..hpq"><img src=dmauvebar.gif width=40 height=11 alt="" border=0>"
          "</a> HIT=\1"
Name = "Kill Unwanted Forms (normal version)"
#What - hide forms that somewhere contain "unwanted" blocklist strings
#Example page - depends on what's in your Forms blocklist
#Date - 10-22-01
#Note - a whole <form>...</form> that hits the Forms_Def list is swapped
#       for a small linked bar image. The leading ^ in URL presumably
#       excludes the listed hosts from filtering - confirm.
Active = TRUE
URL = "^(grc.com|(web|www).altavista.com|astalavista.box.sk|login.yahoo.com)"
Bounds = "<form\s*</form>"
Limit = 8000
Match = "<form*$LST(Forms_Def)*</form>"
Replace = "<a href="http://bweb..hpq"><img src=dmauvebar.gif width=40 height=11 alt="" border=0></a>"
Name = "Hide Unwanted Links by URL (debug version)"
#What - debug for the normal version of this filter, indicates what string caused a match
#Example page - depends on what's in your User Urls blocklist
#Date - 10-22-01
#Note - [^n] after "<a " skips <a name=...> anchors. The blocklist hit
#       inside the href value is captured in \1 and printed as "HIT=...".
#NOTE(review) - the leading (...) group in Match has no capture variable and
#       Replace starts with a bare space; a \0 may have been lost from both
#       when this was posted - confirm against the original filter.
Active = FALSE
URL = "^(infomine.ucr|sosig.ac.)"
Bounds = "<a\s[^n]*>*</a>"
Limit = 1024
Match = "(<a\s*href=$AV(*($LST(Urls_usr))\1*)*>) *</*"
Replace = " <img src=dgreenbar.gif width=25 height=7 alt="" border=0></a> HIT=\1"
Name = "Hide Unwanted Links by URL (normal version)"
#What - hide links that contain "unwanted" blocklist strings in URL part
#Example page - depends on what's in your User Urls blocklist
#Date - 10-22-01
#Note - [^n] after "<a " skips <a name=...> anchors. A link whose href
#       value hits the Urls_usr list is swapped for a small bar image.
#NOTE(review) - the leading (...) group in Match has no capture variable and
#       Replace starts with a bare space; a \0 may have been lost from both
#       when this was posted - confirm against the original filter.
Active = TRUE
Multi = TRUE
URL = "^(infomine.ucr|sosig.ac.|www.online-books.library|www.socsci.kun.nl)"
Bounds = "<a\s[^n]*>*</a>"
Limit = 1024
Match = "(<a\s*href=$AV(*$LST(Urls_usr)*)*>*) *</*"
Replace = " <img src=dgreenbar.gif width=25 height=7 alt="" border=0></a>"
Name = "Hide Unwanted Links by Text (debug version)"
#What - debug for the normal version of this filter, indicates what string caused a match
#Example page - depends on what's in your Keywords blocklist
#Date - 10-22-01
#Note - [^n] after "<a " skips <a name=...> anchors. The blocklist hit at
#       the start of the anchor text is captured in \1 and printed as
#       "HIT=...".
#NOTE(review) - the leading (...) group in Match has no capture variable and
#       Replace starts with a bare space; a \0 may have been lost from both
#       when this was posted - confirm against the original filter.
Active = FALSE
URL = "^(groups.yahoo|digital.library|sosig.ac|www.ipl.org)"
Bounds = "<a\s[^n]*>*</a>"
Limit = 1024
Match = "(<a\s[^n]*>) ($LST(Keyw_def))\1*"
Replace = " <img src=dbluebar.gif width=25 height=7 alt="" border=0></a> HIT=\1"
Name = "Hide Unwanted Links by Text (normal version)"
#What - hide links that contain "unwanted" blocklist strings in anchortext part
#Example page - depends on what's in your Keywords blocklist
#Date - 10-22-01
#Note - [^n] after "<a " skips <a name=...> anchors. A link whose anchor
#       text starts with a Keyw_def hit is swapped for a small bar image.
#NOTE(review) - the leading (...) group in Match has no capture variable and
#       Replace starts with a bare space; a \0 may have been lost from both
#       when this was posted - confirm against the original filter.
Active = TRUE
Multi = TRUE
URL = "^(groups.yahoo|digital.library|sosig.ac|www.ipl.org|www.online-books.library|www.dailyrotation)"
Bounds = "<a\s[^n]*>*</a>"
Limit = 1024
Match = "(<a\s[^n]*>) $LST(Keyw_def)*"
Replace = " <img src=dbluebar.gif width=25 height=7 alt="" border=0></a>"
Name = "Strip JScripted URLs"
#What - convert links like ..href=javascript.openwin(URL, size...) to normal
#Example page -
#Date - 10-22-01
#Note - \w skips the script function name, \( is the literal opening
#       parenthesis of the call, and the first quoted argument is captured
#       in \1 and used as the plain href.
Active = TRUE
Multi = TRUE
Bounds = "<a\s*=("|')javascript:*>"
Limit = 512
Match = "<a\s*href=("|')javascript:\w\(("|')(*)\1("|')*>"
Replace = "<a href="\1">"
...Henk
Best wishes
Arne
Imici username: Arne