#!/bin/bash
#
# Driver for two canned `webbot` crawls, selected by a numeric mode.
#
# Usage: <script> MODE
#   1  crawl www.masseyratings.com, starting at the NHL ratings page
#   2  crawl hollins.edu and assemble the link report hollins.txt
#
# Side effects: 404.txt and log.txt in the current directory are deleted on
# every run, before MODE is looked at. Mode 2 additionally (re)creates
# hollins.txt.
#
# Exit status: 2 for a missing/unknown MODE; otherwise the status of the last
# command of the selected mode (webbot for mode 1, grep for mode 2 -- so
# mode 2 is non-zero when log.txt has no "::::" lines).

# Mode 1: depth-2 crawl limited to the masseyratings.com prefix, skipping
# team.php URLs. webbot is handed log.txt via -referer.
crawl_massey() {
  webbot -q -depth 2 \
    -prefix http://www.masseyratings.com \
    -exclude "team.php" \
    -referer log.txt \
    http://www.masseyratings.com/rate/nhl-p.htm
}

# Mode 2: depth-12 crawl of hollins.edu, then build hollins.txt.
# The final output file contains both broken links (the contents of 404.txt)
# and good links (the lines of log.txt that are prefixed by "::::").
crawl_hollins() {
  # Regexes are single-quoted so the '$' anchors can never be treated as
  # shell expansions; the bytes passed to webbot are unchanged.
  webbot -q -depth 12 \
    -prefix "http://www" \
    -include "hollins.edu" \
    -exclude 'cal_make|postings.cgi' \
    -check '\.doc$|\.pdf$|\.zip$|\.xls$|\.ppt$|\.mov$|\.JPG$' \
    -404 404.txt \
    -referer log.txt \
    http://www1.hollins.edu/

  # Broken links first, then the good ones; hollins.txt is truncated even if
  # webbot produced neither input file.
  {
    cat 404.txt
    grep "::::" log.txt
  } > hollins.txt
}

# Entry point. $1 is the mode ("1" or "2"); it may be absent.
main() {
  # ${1:-} keeps a missing argument from breaking the comparison (the old
  # unquoted `[ $1 = "1" ]` failed with "unary operator expected").
  local mode=${1:-}

  # Always start from a clean slate so stale results never leak into a report.
  rm -f -- 404.txt log.txt

  case "$mode" in
    1)
      crawl_massey
      ;;
    2)
      crawl_hollins
      ;;
    *)
      printf 'usage: %s {1|2}\n' "${0##*/}" >&2
      return 2
      ;;
  esac
}

main "$@"