# Robot (crawler) configuration.
#
# Every setting is a plain package variable assigned at file scope; the
# trailing "1;" makes the file return a true value when it is loaded.
# All *_allow / *_deny entries are bare regular-expression source strings
# (no m// delimiters) -- presumably matched against each candidate URL by
# the robot; verify against the consuming script.

# time out (seconds)
$timeout = 60;

# delay time (minutes)
$delay = 0.5;

# the mail address of the human responsible for the robot
$email_adr = 'you@yourdomain';

# start URL
@start_urls = (
    'http://aaa.intranet.ne.jp/',
    'http://bbb.intranet.ne.jp/',
    'http://ccc.intranet.ne.jp/~user1/',
);

# number of resources
$count = 10;

# fetch allow pattern
# The dots of the domain are escaped so that "." only matches a literal
# dot; an unescaped "." would also accept hosts such as "intranetXneXjp".
@fetch_allow = (
    '^http://.*\.intranet\.ne\.jp/.*\.html$',
    '^http://.*\.intranet\.ne\.jp/.*\.htm$',
    '^http://.*\.intranet\.ne\.jp/.*\.txt$',
    '^http://.*\.intranet\.ne\.jp/.*/$',
    '^http://.*\.intranet\.ne\.jp/$',
    '^http://.*\.intranet\.ne\.jp$',
    '^file:///home/search/work/download/.*html$',
    '^file:///home/search/work/download/.*htm$',
    '^file:///home/search/work/download/.*txt$',
    '^file:///home/search/work/download/.*/$',
);

# fetch deny pattern
# Written as a bare regex like the allow patterns.  Wrapping it in literal
# slashes ('/\/jdk[\d\.]+/') would, as a bare regex, only match "//jdk1.2/"
# and so would not exclude ordinary ".../jdk1.2/..." paths.
@fetch_deny = (
    '/jdk[\d.]+',
);

# save allow pattern
@save_allow = (
    '^http://.*\.intranet\.ne\.jp/.*\.html$',
    '^http://.*\.intranet\.ne\.jp/.*\.htm$',
    '^http://.*\.intranet\.ne\.jp/.*\.txt$',
    '^http://.*\.intranet\.ne\.jp/.*/$',
    '^http://.*\.intranet\.ne\.jp/$',
    '^http://.*\.intranet\.ne\.jp$',
);

# translate pattern (URL prefix => replacement prefix)
%tran_pat = (
    'file:///home/search/work/download/' => 'http://',
);

# database name
$dbname = 'search';

# download directory
$downdir = "download";

# default file name when file name is not given
$defaultfname = "_default";

1;