Author: hstern
Date: Mon Aug 9 10:47:08 2004
New Revision: 36121
Modified:
spamassassin/trunk/masses/runGA
Log:
* runGA
Saved the training and test sets, as per Justin's request.
Modified: spamassassin/trunk/masses/runGA
==============================================================================
--- spamassassin/trunk/masses/runGA (original)
+++ spamassassin/trunk/masses/runGA Mon Aug 9 10:47:08 2004
@@ -33,27 +33,27 @@
# Generate 90/10 split logs
echo "[Generating 90/10 split ham]"
-mkdir NSBASE SPBASE
-cd NSBASE
-../tenpass/split-log-into-buckets-random 10 < ../ORIG/ham-$NAME.log > /dev/null
+mkdir $LOGDIR/NSBASE $LOGDIR/SPBASE
+cd $LOGDIR/NSBASE
+../../tenpass/split-log-into-buckets-random 10 < ../../ORIG/ham-$NAME.log > /dev/null
cat split-[1-9].log > ham.log
rm -f split-[1-9].log
mv split-10.log ham-test.log
echo "[Generating 90/10 split spam]"
cd ../SPBASE
-../tenpass/split-log-into-buckets-random 10 < ../ORIG/spam-$NAME.log > /dev/null
+../../tenpass/split-log-into-buckets-random 10 < ../../ORIG/spam-$NAME.log > /dev/null
cat split-[1-9].log > spam.log
rm -f split-[1-9].log
mv split-10.log spam-test.log
-cd ..
+cd ../..
echo "[Setting up for gen run]"
# Ok, setup for a run
-ln -s SPBASE/spam.log .
-ln -s NSBASE/ham.log .
-ln -s SPBASE/spam-test.log .
-ln -s NSBASE/ham-test.log .
+ln -s $LOGDIR/SPBASE/spam.log .
+ln -s $LOGDIR/NSBASE/ham.log .
+ln -s $LOGDIR/SPBASE/spam-test.log .
+ln -s $LOGDIR/NSBASE/ham-test.log .
# try to find number of processors
numcpus=`cpucount 2>/dev/null || egrep -c '^processor\b' /proc/cpuinfo 2>/dev/null || echo 1`
@@ -81,8 +81,8 @@
# This needs to have 50_scores.cf in place first ...
echo "[gen test results]"
-./logs-to-c --spam=SPBASE/spam-test.log \
- --ham=NSBASE/ham-test.log \
+./logs-to-c --spam=spam-test.log \
+ --ham=ham-test.log \
--count --cffile=../rules --scoreset=$SCORESET | tee $LOGDIR/test
echo "[STATISTICS file generation]"
Date: Mon Aug 9 10:47:08 2004
New Revision: 36121
Modified:
spamassassin/trunk/masses/runGA
Log:
* runGA
Saved the training and test sets, as per Justin's request.
Modified: spamassassin/trunk/masses/runGA
==============================================================================
--- spamassassin/trunk/masses/runGA (original)
+++ spamassassin/trunk/masses/runGA Mon Aug 9 10:47:08 2004
@@ -33,27 +33,27 @@
# Generate 90/10 split logs
echo "[Generating 90/10 split ham]"
-mkdir NSBASE SPBASE
-cd NSBASE
-../tenpass/split-log-into-buckets-random 10 < ../ORIG/ham-$NAME.log > /dev/null
+mkdir $LOGDIR/NSBASE $LOGDIR/SPBASE
+cd $LOGDIR/NSBASE
+../../tenpass/split-log-into-buckets-random 10 < ../../ORIG/ham-$NAME.log > /dev/null
cat split-[1-9].log > ham.log
rm -f split-[1-9].log
mv split-10.log ham-test.log
echo "[Generating 90/10 split spam]"
cd ../SPBASE
-../tenpass/split-log-into-buckets-random 10 < ../ORIG/spam-$NAME.log > /dev/null
+../../tenpass/split-log-into-buckets-random 10 < ../../ORIG/spam-$NAME.log > /dev/null
cat split-[1-9].log > spam.log
rm -f split-[1-9].log
mv split-10.log spam-test.log
-cd ..
+cd ../..
echo "[Setting up for gen run]"
# Ok, setup for a run
-ln -s SPBASE/spam.log .
-ln -s NSBASE/ham.log .
-ln -s SPBASE/spam-test.log .
-ln -s NSBASE/ham-test.log .
+ln -s $LOGDIR/SPBASE/spam.log .
+ln -s $LOGDIR/NSBASE/ham.log .
+ln -s $LOGDIR/SPBASE/spam-test.log .
+ln -s $LOGDIR/NSBASE/ham-test.log .
# try to find number of processors
numcpus=`cpucount 2>/dev/null || egrep -c '^processor\b' /proc/cpuinfo 2>/dev/null || echo 1`
@@ -81,8 +81,8 @@
# This needs to have 50_scores.cf in place first ...
echo "[gen test results]"
-./logs-to-c --spam=SPBASE/spam-test.log \
- --ham=NSBASE/ham-test.log \
+./logs-to-c --spam=spam-test.log \
+ --ham=ham-test.log \
--count --cffile=../rules --scoreset=$SCORESET | tee $LOGDIR/test
echo "[STATISTICS file generation]"