#!/bin/sh
# (c) 2001 Ondrej Jombik <nepto@pobox.sk>
# $Id: extract.sh,v 1.1 2002/02/12 00:34:26 jombik9 Exp $
# Collects e-mail addresses for a given first name.
#
# Usage: extract.sh <first_name>
#
# The script downloads the WhoWhere search result page for the name with
# lynx, pipes the HTML through the getmails helper script, and appends the
# de-duplicated addresses of each page to $OUTPUT_FILE. It then follows the
# link found on the line matching 'email.more.wsrch' and repeats until no
# such link is present. Progress (start/finish markers and the number of
# addresses per page) is appended to $LOG_FILE.
#
# All working files are created in the current directory. $HTML_SOURCE_FILE
# is intentionally left behind after the run.
LOG_FILE='mail_action.log'
HTML_SOURCE_FILE='source.tmp.html'
CURRENT_ADDRESSES_FILE='current.tmp.txt'
OUTPUT_FILE='addresses.txt'
# A tilde is not expanded inside quotes, so the home directory is spelled
# out via $HOME; otherwise the helper would never be found.
GETMAILS_SCRIPT="$HOME/prog/scripts/shell/getmails/getmails.sh"
##############################################################################
if [ $# -lt 1 ]; then
  echo "Usage: $0 <first_name>" >&2
  exit 1
fi

# printf instead of 'echo -e': under /bin/sh the -e flag is not portable and
# some shells would write it literally into the log.
printf '%s\n' '--' "Starting processing name '$1'" >> "$LOG_FILE"

lynx -source \
  'http://whowhere.lycos.com/srvredirect?Submit=Search&find=email&f-name='"$1" \
  > "$HTML_SOURCE_FILE"

while [ -r "$HTML_SOURCE_FILE" ]; do
  # Extract the addresses of the current page, sorted and without duplicates.
  "$GETMAILS_SCRIPT" < "$HTML_SOURCE_FILE" \
    | sort -u \
    > "$CURRENT_ADDRESSES_FILE"

  count=$(wc -l < "$CURRENT_ADDRESSES_FILE")
  # $(( )) drops the leading padding some wc implementations emit.
  printf '+ %s\n' "$((count))" >> "$LOG_FILE"

  cat "$CURRENT_ADDRESSES_FILE" >> "$OUTPUT_FILE"

  # Locate the "more results" link: the last double-quoted http:// URL on
  # the first line mentioning email.more.wsrch. Stopping after the first
  # match keeps several matching lines from being glued into one bogus URL.
  query=$(grep 'email.more.wsrch' "$HTML_SOURCE_FILE" \
    | perl -ne 'if (/^.*"(http:\/\/[^"]*)"/) { print $1; exit }')

  if [ -n "$query" ]; then
    # Quoted so that '?' in the URL is never subject to word splitting or
    # pathname expansion.
    lynx -source "$query" > "$HTML_SOURCE_FILE"
  else
    #rm -f "$HTML_SOURCE_FILE"
    break
  fi
done

rm -f "$CURRENT_ADDRESSES_FILE"
printf '%s\n' "Finishing processing name '$1'" >> "$LOG_FILE"
# Platon Group <platon@platon.sk> http://platon.sk/