contrib/phishing/update_iana_data.sh
121c75e1
 #
 #  Phishing detection automated testing & tools.
 #  Copyright (C) 2006 Torok Edvin <edwintorok@gmail.com>
 #
 #  This program is free software; you can redistribute it and/or modify
 #  it under the terms of the GNU General Public License as published by
 #  the Free Software Foundation; either version 2 of the License, or
 #  (at your option) any later version.
 #
 #  This program is distributed in the hope that it will be useful,
 #  but WITHOUT ANY WARRANTY; without even the implied warranty of
 #  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 #  GNU General Public License for more details.
 #
 #  You should have received a copy of the GNU General Public License
 #  along with this program; if not, write to the Free Software
 #  Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
 #  MA 02110-1301, USA.
 #
4ce98744
 #!/bin/sh
 IANA_TLD="http://data.iana.org/TLD/tlds-alpha-by-domain.txt"
 IANA_CCTLD="http://www.iana.org/cctld/cctld-whois.htm";
 TMP=`tempfile`
 OUTFILE=iana_tld.h
 
 echo "Downloading updated tld list from iana.org"
 wget $IANA_TLD -O $TMP || exit 2
 echo "Download complete, parsing data"
 # 174 is the code for |
 TLDLIST=$(egrep -v ^# $TMP | tr \\n \\174 | sed 's/[^a-zA-Z]$//')
 echo "Parse complete, removing tmpfile"
 rm $TMP
 echo "Generating tld list in $OUTFILE"
 cat >$OUTFILE <<EOF
 #ifndef IANA_TLD_H
 #define IANA_TLD_H
 EOF
 echo -n "#define iana_tld \"(" >>$OUTFILE
 echo -n $TLDLIST >>$OUTFILE
 echo ")\"" >>$OUTFILE
 
 echo "Downloading updated country-code list from iana.org"
 wget $IANA_CCTLD -O $TMP || exit 2
 echo "Download complete, parsing data"
 CCTLDLIST=$(cat $TMP | egrep -oi "<a href=[^>]+>\\.([a-z]+).+</a>" | egrep -o ">.[a-z]+" | colrm 1 2 | tr \\n \\174 | sed 's/[^a-zA-Z]$//')
 echo "Parse complete, removing tmpfile"
 rm $TMP
 echo "Generating cctld list in $OUTFILE"
 echo -n "#define iana_cctld \"(" >>$OUTFILE
 echo -n $CCTLDLIST >>$OUTFILE
 echo ")\"" >>$OUTFILE
 
 
 echo "#endif" >>$OUTFILE
 echo "Finished succesfully"