File:  [Public] / libwww / Robot / src / robot.sh
Revision 1.2: download - view: text, annotated - select for diffs
Sat Feb 7 23:59:39 1998 UTC (26 years, 4 months ago) by frystyk
Branches: MAIN
CVS tags: Release-5-1l, Release-5-1k, Release-5-1j, HEAD
*** empty log message ***

#!/bin/sh
# The three leading arguments (RootURI, ImageRootURI, LogPrefix) are
# mandatory. When fewer are supplied, print the help text on stdout and
# terminate with exit status 1.
[ "$#" -ge 3 ] || {
	printf '%s\n' \
		'A simple example of how the libwww robot can be used' \
		'For a full description, see' \
		'' \
		'        http://www.w3.org/Robot/User/CommandLine.html' \
		''
	# The usage line separates "Usage:" from the script name with a tab.
	printf 'Usage:\t%s RootURI ImageRootURI LogPrefix [ flags ]\n' "$0"
	printf '%s\n' \
		'' \
		'where' \
		'        RootURI       is the URI prefix for links, for example http://www.w3.org/Robot/' \
		'        ImageRootURI  is the URI prefix for inlined images, for example http://www.w3.org' \
		'        LogPrefix     is the prefix for log files, for example robot' \
		'        flags         are any additional command line flags, for example -vp' \
		'' \
		'See' \
		'        http://www.w3.org/Robot/' \
		'' \
		'for more information'
	exit 1
}

# Positional arguments. The argument-count check earlier in the script
# guarantees that the first three are present.
ROOT=$1      # URI prefix for links; also used as the start URI (last argument)
IMGROOT=$2   # URI prefix for inlined images
LOG=$3       # prefix from which every log file name below is derived

# The fourth argument may hold several flags in one quoted string
# (for example "-v -p"); it is deliberately word-split when expanded below
# so that existing callers keep working.
FLAGS=${4-}

# Every argument after the fourth is forwarded to the robot verbatim.
# Previously these were silently dropped although the usage text promises
# "any additional command line flags".
if [ "$#" -gt 4 ]; then
	shift 4
else
	set --
fi

# Path of the webbot executable. The historical location remains the
# default; set ROBOT in the environment to use a different binary.
ROBOT=${ROBOT:-/home/frystyk/w3c-lib/Robot/src/webbot}

# All user-supplied values are quoted so that URIs containing glob
# characters (?, *, [) and log prefixes containing whitespace reach the
# robot unchanged. Only FLAGS is left unquoted, on purpose (see above).
# shellcheck disable=SC2086
"${ROBOT}" ${FLAGS} "$@" -q -ss -n -depth 99 \
	-exclude "/ArchiveBrowser/|/History/|/member/|/team/" \
	-check '\.gz$|\.Z$|\.zip$|\.ZIP$|\.tar$|\.ps$|\.doc$|\.pdf$|\.xplot$|\.java$|\.c$|\.h$|\.txt$|\.ppt$|\.gif$|\.GIF$|\.tiff$|\.png$|\.PNG$|\.jpeg$|\.jpg$|\.JPE$' \
	-prefix "${ROOT}" \
	-img -imgprefix "${IMGROOT}" \
	-l "${LOG}-log-clf.txt" \
	-alt "${LOG}-log-alt.txt" \
	-hit "${LOG}-log-hit.txt" \
	-rellog "${LOG}-log-link-relations.txt" -relation stylesheet \
	-lm "${LOG}-log-lastmodified.txt" \
	-title "${LOG}-log-title.txt" \
	-referer "${LOG}-log-referer.txt" \
	-negotiated "${LOG}-log-negotiated.txt" \
	-404 "${LOG}-log-notfound.txt" \
	-reject "${LOG}-log-reject.txt" \
	-format "${LOG}-log-format.txt" \
	-charset "${LOG}-log-charset.txt" \
	"${ROOT}"

Webmaster