summary | refs | log | tree | commit | diff
path: root/scripts/stats/clean.sh
diff options
context:
space:
mode:
author: Paul Buetow <paul@buetow.org> 2011-03-06 10:57:41 +0000
committer: Paul Buetow <paul@buetow.org> 2011-03-06 10:57:41 +0000
commit: 213033db33be271791f2d9ff1c9c44c0bed79f18 (patch)
tree: 1b3ff0d0eddfc7f6995afa67b5d3fc2ef8fa85a7 /scripts/stats/clean.sh
initial xerl import to utils
Diffstat (limited to 'scripts/stats/clean.sh')
-rwxr-xr-x scripts/stats/clean.sh 49
1 files changed, 49 insertions, 0 deletions
diff --git a/scripts/stats/clean.sh b/scripts/stats/clean.sh
new file mode 100755
index 0000000..ba0f0e8
--- /dev/null
+++ b/scripts/stats/clean.sh
@@ -0,0 +1,49 @@
+#!/bin/sh
+
+# 2006 - 2008 The Xerl Project
+
+for log in *.log
+do
+ re=''
+ for remove in \
+ Charlotte \
+ Exabot \
+ Mnogo \
+ Netcraft \
+ Perl \
+ Python \
+ SurveyBot \
+ VoilaBot \
+ Yandex \
+ Yeti \
+ ajSitemap \
+ archiver \
+ crawler \
+ feed \
+ findlinks \
+ fulltext \
+ googlebot \
+ grabber \
+ jeeves \
+ msnbot \
+ pear \
+ pingdom \
+ rss2 \
+ sagool \
+ sbider \
+ slurp \
+ spider \
+ tagsdir \
+ validator \
+ walhello \
+ ;do
+ if [ -z "$re" ]
+ then
+ re="($remove)"
+ else
+ re="$re|($remove)"
+ fi
+ done
+ grep -E -i -v "$re" $log > $log.new
+ mv -f $log.new $log
+done