| 1 | adcroft | 1.1 | #!/usr/bin/perl -w | 
| 2 |  |  |  | 
| 3 |  |  | foreach $arg (@ARGV) { | 
| 4 |  |  | &spider(0,$arg); | 
| 5 |  |  | #@qq = &scnfle($arg); | 
| 6 |  |  | #print @qq; | 
| 7 |  |  | } | 
| 8 |  |  |  | 
| 9 |  |  | sub scnfle { | 
| 10 |  |  | local($topfile) = $_[0]; | 
| 11 |  |  | local(@listofhrefs) = (); | 
| 12 |  |  |  | 
| 13 |  |  | open(HF,$topfile) || die "Couldn't open $topfile!\n"; | 
| 14 |  |  |  | 
| 15 |  |  | while (<HF>) { | 
| 16 |  |  | if (s/.*href=(["a-zA-Z0-9:\/].*)">.*/$1/) { | 
| 17 |  |  | s/"//g;    # strip out quotes | 
| 18 |  |  | s/>.*//;   # strip of end | 
| 19 |  |  | chop; | 
| 20 |  |  | @listofhrefs=(@listofhrefs,$_) | 
| 21 |  |  | }; | 
| 22 |  |  | } | 
| 23 |  |  | @listofhrefs; | 
| 24 |  |  | } | 
| 25 |  |  |  | 
| 26 |  |  | sub spider { | 
| 27 |  |  | local($thislevel) = $_[0]; | 
| 28 |  |  | local($thisfile) = $_[1]; | 
| 29 |  |  |  | 
| 30 |  |  | if ($thislevel >=2) {return;} | 
| 31 |  |  |  | 
| 32 |  |  | print "spider: level $thislevel, $thisfile\n"; | 
| 33 |  |  | @hrefs=scnfle($thisfile); | 
| 34 |  |  | #print "spider: $thisfile: @hrefs\n"; | 
| 35 |  |  | foreach $href (@hrefs) { | 
| 36 |  |  | if ($href ne $thisfile) { | 
| 37 |  |  | print "$thisfile: -> $href\n"; | 
| 38 |  |  | spider($thislevel+1,$href); | 
| 39 |  |  | } | 
| 40 |  |  | } | 
| 41 |  |  | } |