#! /bin/ksh
# Get web links for the genealogy web site
# written by John Guest June 20, 1997
#
# For every *.html file in the current directory, scan each line for
# double-quoted strings that start with a telnet, gopher, ftp or http
# scheme and append the first whitespace-delimited word of each such
# string to html.list.  Progress is printed to stdout and appended to
# href.log.
#
# NOTE(review): the two index($i, "") calls below search for an empty
# string.  They look like literals (possibly HTML tags) that were lost when
# this file was extracted; their result with an empty pattern differs between
# awk implementations.  They are kept as found -- confirm the intended
# strings against an original copy of the script.

# extract http links
# (to try a single page, loop over "index.html" instead of the glob)
for file in *.html
do
    # An unmatched glob is left as the literal "*.html"; skip anything that
    # is not a regular file instead of feeding it to awk.
    [[ -f $file ]] || continue

    print "processing $file ..."
    print "processing $file ..." >>href.log

    awk '
    BEGIN {
        FS = "\""
        # Schemes are tried in this order for every input line, so the
        # output order is telnet, gopher, ftp, then http links per line.
        nschemes = split("telnet gopher ftp http", scheme, " ")
    }
    {
        for (s = 1; s <= nschemes; s++) {
            # Cheap pre-filter: the line must mention "<scheme>:" somewhere.
            if (index($0, scheme[s] ":") > 0) {
                for (i = 1; i <= NF; i++) {
                    # n counts occurrences of markers that disqualify a field.
                    n  = index($i, "")
                    n += index($i, "")
                    n += index($i, "\n")
                    if (substr($i, 1, length(scheme[s])) == scheme[s] && n == 0) {
                        # Keep only the first word of the quoted string.
                        split($i, word, " ")
                        print word[1]
                    }
                }
            }
        }
    }' <"$file" >>html.list
done