Difference between revisions of "Meta:Spam Blacklist"

From Perplex City Wiki
Jump to: navigation, search
 
(10 intermediate revisions by 2 users not shown)
Line 27: Line 27:
 
dgo5d.info
 
dgo5d.info
 
ringtone
 
ringtone
 +
 +
# More spam terms, added 2007-06-10
 +
diazepam
 +
xenical
 +
ringtones
 +
wellbutrin
 +
ativan
 +
viagra
 +
lorazepam
 +
vicodin
 +
 +
# Pages that have been hacked (the spam keywords aren't in the URL, so blacklist isn't effective against the link)
 +
stanford.edu/seminar
 +
sunysb.edu
 +
bc.edu
 +
sc.edu
 +
ku.edu
 +
usc.edu
 +
msoe.edu
 +
 +
# More spammy URLs from 2007-08-17
 +
helmed.info
 +
nobinters.org
 +
davte.info
 +
amohseni.info
 +
psisemiya.com
 +
ashythro.info
 +
kinuia.cn
 +
 +
# More on 2007-08-19
 +
ifrance.com
 +
 +
# 2007-08-22
 +
rigour.info
 +
110mb.com
 +
 +
#2007-08-30
 +
sneck.info
 +
primonona.info
 +
funkall.us
 +
veggis.org
 +
klohy.info
 +
budget7i.info
 +
svike.info
 +
manoke.cn
 +
xionny.cn
 +
wedner.info
 +
soler.net.cn
 +
polex.com.cn
 +
 +
#2008-08-07
 +
chaosantiques.com
 +
travelchinaplanner.com
 +
hkcbn.org
 +
16885.com
  
 
  #</pre> <!-- leave this line exactly as it is -->
 
  #</pre> <!-- leave this line exactly as it is -->

Latest revision as of 17:31, 7 August 2008

#
 
#
# In simple terms:
#    * Everything from a "#" character to the end of the line is a comment
#    * Every non-blank line is a regex fragment which will only match inside URLs
#
# Internally, a regex is formed which looks like this:
#
#    !http://[a-z0-9\-.]*(line 1|line 2|line 3|....)!Si
#
# A few notes about this format: It's not necessary to add www to the start of
# hostnames; the regex is designed to match any subdomain. Don't add patterns
# to your file which may run off the end of the URL, e.g. anything containing
# ".*". Unlike in some similar systems, the line-end metacharacter "$" will not
# assert the end of the hostname; it will assert the end of the page.
#

# Test blacklist
example\.com

# Spammer URL partials added 2006-10-16
casino-games
adipex
tramadol

# Spammer URL partials added 2006-12-22 because of User 1166728278
dgo5d.info
ringtone

# More spam terms, added 2007-06-10
diazepam
xenical
ringtones
wellbutrin
ativan
viagra
lorazepam
vicodin

# Pages that have been hacked (the spam keywords aren't in the URL, so the blacklist terms above aren't effective against these links)
stanford.edu/seminar
sunysb.edu
bc.edu
sc.edu
ku.edu
usc.edu
msoe.edu

# More spammy URLs from 2007-08-17
helmed.info
nobinters.org
davte.info
amohseni.info
psisemiya.com
ashythro.info
kinuia.cn

# More on 2007-08-19
ifrance.com

# 2007-08-22
rigour.info
110mb.com

# 2007-08-30
sneck.info
primonona.info
funkall.us
veggis.org
klohy.info
budget7i.info
svike.info
manoke.cn
xionny.cn
wedner.info
soler.net.cn
polex.com.cn

# 2008-08-07
chaosantiques.com
travelchinaplanner.com
hkcbn.org
16885.com

 #