Author Topic: Filters by Henk  (Read 2443 times)

Arne

  • Administrator
  • Hero Member
  • *****
  • Posts: 778
    • ICQ Messenger - 1448105
    • AOL Instant Messenger - aflaaten
    • Yahoo Instant Messenger - arneflaa
    • View Profile
    • http://
    • Email
Filters by Henk
« on: October 25, 2001, 09:51:09 PM »
Henk has posted a few of his filters, and I have placed them here as a collection:

FILTERS:

Name = "Lockergnome Cleaner"
#What - removes lockergnome "sidebar" text ads
#Example page - http://www.lockergnome.com/issues/daily.html
#Date - 10-22-01
Active = TRUE
URL = "www.lockergnome.com"
Bounds = "<p class="sidebar"><table*><tr><td>*</p>"
Limit = 3000
Match = "<p class="sidebar">$NEST(<table*>,</table>)</p>"

Name = "FreewarePublishing Cleaner"
#What - removes huge junk section from FPS
#Example page - http://www.katho.be/freeware/freeware.htm
#Date - 10-22-01
Active = TRUE
URL = "www.katho.be/freeware"
Limit = 32000
Match = "<!-+??????XX?X+?-+>*<!-+??????XX?X+?-+>"
Replace = "$STOP()"

Name = "FreewarePublishing Linkbuster"
#What - removes most spam&junk links from FPS
#Example page - http://www.katho.be/freeware/freeware.htm
#Date - 10-22-01
Active = TRUE
URL = "www.katho.be/freeware/"
Bounds = "<!--soft*<!--endsoft*>"
Limit = 4000
Match = "<!--soft*<!--info-->*($LST(Urls_usr))*<!--endsoft[^>]++>"

Name = "ZDNet Cleaner"
#What - removes page bottom junk part from ZDNet
#Example page - http://www.zdnet.com/pcmag/
#Date - 10-22-01
Active = TRUE
URL = "www.zdnet.com"
Limit = 256
Match = "<P ALIGN='center'>|<!--START SPONSORED LINKS-->"
Replace = "</body></html>\k$STOP()"

Name = "LII Tracking Links Cleaner"
#What - converts the funny tracking links at Lii to normal urls
#Example page - http://lii.org/search?title=New+This+Week&query=New+this+week&subsearch=New+this+week&searchtype=subject
#Date - 10-22-01
Active = TRUE
URL = "lii.org"
Bounds = "<a href=*</font>"
Limit = 256
Match = "<A HREF="/search?goto=[#1-*]">*2</A>*http://1</FONT>"
Replace = "<a href="http://1">2</a>"

Name = "Yahoo Form Filler"
#What - Needed because of using session-only cookies
#Example page - http://login.yahoo.com/config/login?.intl=us&.src=ygrp&.done=http://groups.yahoo.com%2Fgroup%2Fprox-list%2F
#Date - 10-22-01
Active = TRUE
URL = "login.yahoo.com"
Limit = 1000
Match = "<input name="login" size="17" maxlength="32" value="">(*)1<input name="passwd""
Replace = "<input name="login" size="17" maxlength="32" value="myusername">1<input name="passwd" value="mypassword""
          "$STOP()"

Name = "Tucows Freeware Links Only"
#What - remove non-freeware from Tucows (leaving GPL, freeware in place)
#Example page - http://tucows.nl.uu.net/whatsnew.html
#Date - 10-22-01
Active = TRUE
Multi = TRUE
URL = "tucows.nl.uu.net"
Bounds = "<!-- Current program set to*<!--"
Limit = 2000
Match = "<!-- Current program set to [#0-*] -->*((share|ad)ware|demo|commerc*)<*<!--"
Replace = "<!--"

Name = "Koodles Cleaner part 1"
#What - remove Koodles top and sidebar junk
#Example page - http://www.fileclicks.com/?show=2
#Date - 10-22-01
Active = TRUE
URL = "www.fileclicks.com"
Bounds = "<table width="760"*<img src="kooimgs/tabs/FileDirectory.gif""
Limit = 14000
Match = "<table width="760"*<img src="kooimgs/tabs/FileDirectory.gif""
Replace = "<table width="100%" border="0" cellspacing="0" cellpadding="0">"
          "<tr>"
          "<td valign="top" width="466">"
          "<table width="450" border="0" cellspacing="0" cellpadding="0" align="center">"
          "<tr>"
          "<td valign="top" align="left" colspan="3">"
          "<img src="kooimgs/tabs/FileDirectory.gif"$STOP()"

Name = "Koodles Cleaner part 2"
#What - remove Koodles page bottom junk
#Example page -
#Date - 10-22-01
Active = TRUE
URL = "www.fileclicks.com"
Bounds = "<b>..Old Blurbs*</div>"
Limit = 256
Match = "<b>..Old Blurbs</b></a></td>*</tr>*</table>*</div>"
Replace = "<b>..Old Blurbs</b></a></td></tr></table></div>"
          "</body></html>\k$STOP()"

Name = "UnBold Bold Text"
#What - removing all that overused bold makes pages much more serene (use css too)
#Example page - wherever
#Date - 10-22-01
Active = TRUE
Multi = TRUE
Bounds = "<(/|)(b|s)*>"
Limit = 20
Match = "<(/|)(b(s*|link|)|strong)>"
Replace = "<!--b-->"

Name = "Show Link Instead of Auto-Redirection"
#What - instead of killing redirection, which leaves no choice, make it a link
#Example page - all pages that use simple redirection
#Date - 10-22-01
Active = TRUE
Bounds = "<(meta*|script*</script)>"
Limit = 512
Match = "<(meta http-equiv="refresh" content="[#0-15]; URL=(w)1 * |"
        "script>*document.location.replace(("|**FIX**|) 1
("|**FIX**|))*</script)>"
Replace = "<font size=2><tt>This page would have redirected you to <a href="1">1</A></tt></font><hr size=1>"
          "$STOP()"

Name = "Hide ImageMaps by Text"
#What - hide imagemaps that somewhere contain "unwanted" blocklist strings
#Example page - depends on what's in your Keywords blocklist
#Date - 10-22-01
Active = TRUE
Bounds = "<im(g|age)s*usemap*>"
Limit = 1024
Match = "<im(g|age)s*$LST(Keyw_def)*>"
Replace = "<img src=dbluebar.gif width=25 height=7 alt="" border=0>"

Name = "Kill Unwanted Forms (debug version)"
#What - debug for filter below, indicates what string caused a match
#Example page - depends on what's in your Forms blocklist
#Date - 10-22-01
Active = FALSE
URL = "^(grc.com|(web|www).altavista.com|(login|groups).yahoo.com)"
Bounds = "<forms*</form>"
Limit = 8000
Match = "<form*($LST(Forms_Def))1*</form>"
Replace = "<a href="http://bweb..hpq"><img src=dmauvebar.gif width=40 height=11 alt="" border=0>"
          "</a> HIT=1"

Name = "Kill Unwanted Forms (normal version)"
#What - hide forms that somewhere contain "unwanted" blocklist strings
#Example page - depends on what's in your Forms blocklist
#Date - 10-22-01
Active = TRUE
URL = "^(grc.com|(web|www).altavista.com|astalavista.box.sk|login.yahoo.com)"
Bounds = "<forms*</form>"
Limit = 8000
Match = "<form*$LST(Forms_Def)*</form>"
Replace = "<a href="http://bweb..hpq"><img src=dmauvebar.gif width=40 height=11 alt="" border=0></a>"

Name = "Hide Unwanted Links by URL (debug version)"
#What - debug for filter below, indicates what string caused a match
#Example page - depends on what's in your User Urls blocklist
#Date - 10-22-01
Active = FALSE
URL = "^(infomine.ucr|sosig.ac.)"
Bounds = "<as[^n]*>*</a>"
Limit = 1024
Match = "(<as*href=$AV(*($LST(Urls_usr))1*)*>)*</*"
Replace = "<img src=dgreenbar.gif width=25 height=7 alt="" border=0></a> HIT=1"

Name = "Hide Unwanted Links by URL (normal version)"
#What - hide links that contain "unwanted" blocklist strings in URL part
#Example page - depends on what's in your User Urls blocklist
#Date - 10-22-01
Active = TRUE
Multi = TRUE
URL = "^(infomine.ucr|sosig.ac.|www.online-books.library|www.socsci.kun.nl)"
Bounds = "<as[^n]*>*</a>"
Limit = 1024
Match = "(<as*href=$AV(*$LST(Urls_usr)*)*>*)*</*"
Replace = "<img src=dgreenbar.gif width=25 height=7 alt="" border=0></a>"

Name = "Hide Unwanted Links by Text (debug version)"
#What - debug for filter below, indicates what string caused a match
#Example page - depends on what's in your Keywords blocklist
#Date - 10-22-01
Active = FALSE
URL = "^(groups.yahoo|digital.library|sosig.ac|www.ipl.org)"
Bounds = "<as[^n]*>*</a>"
Limit = 1024
Match = "(<as[^n]*>)($LST(Keyw_def))1*"
Replace = "<img src=dbluebar.gif width=25 height=7 alt="" border=0></a> HIT=1"

Name = "Hide Unwanted Links by Text (normal version)"
#What - hide links that contain "unwanted" blocklist strings in anchortext part
#Example page - depends on what's in your Keywords blocklist
#Date - 10-22-01
Active = TRUE
Multi = TRUE
URL = "^(groups.yahoo|digital.library|sosig.ac|www.ipl.org|www.online-books.library|www.dailyrotation)"
Bounds = "<as[^n]*>*</a>"
Limit = 1024
Match = "(<as[^n]*>)$LST(Keyw_def)*"
Replace = "<img src=dbluebar.gif width=25 height=7 alt="" border=0></a>"

Name = "Strip JScripted URLs"
#What - convert links like ..href=javascript.openwin(URL, size...) to normal
#Example page -
#Date - 10-22-01
Active = TRUE
Multi = TRUE
Bounds = "<as*=("|')javascript:*>"
Limit = 512
Match = "<as*href=("|')javascript:w(("|')(*)1("|')*>"
Replace = "<a href="1">"

...Henk


Best wishes
Arne
Imici username: Arne
Best wishes
Arne
Imici username= Arne