#----------------------------- |
# download the following standalone program |
#!/usr/bin/perl -w
# churl - check urls
#
# Usage: churl <start_url>
#
# Fetches the page at <start_url>, extracts every link-bearing attribute
# with HTML::LinkExtor, and issues a HEAD request for each link whose
# scheme is ftp, http, https or file, printing "OK" or "BAD" per link.
use strict;
use warnings;

use HTML::LinkExtor;
use LWP::Simple qw(get head);

my $base_url = shift
    or die "usage: $0 <start_url>\n";

# get() returns undef when the fetch fails; stop here instead of
# handing an undefined document to the parser.
my $page = get($base_url);
defined $page
    or die "$0: cannot fetch $base_url\n";

# Passing the base URL makes the extractor absolutize every link and
# return it as a URI object, which is why ->scheme can be called below.
my $parser = HTML::LinkExtor->new(undef, $base_url);
$parser->parse($page);
$parser->eof;    # signal end of document so buffered text is processed
my @links = $parser->links;

print "$base_url: \n";
foreach my $linkarray (@links) {
    # Each entry is [ $tag, attr_name => attr_value, ... ].
    my @element = @$linkarray;
    shift @element;    # discard the tag name; only the attributes matter

    while (@element) {
        my (undef, $attr_value) = splice(@element, 0, 2);

        my $scheme = $attr_value->scheme;
        next unless defined $scheme;

        # Anchored match: only the schemes we know how to probe.
        if ($scheme =~ /\A(?:ftp|https?|file)\z/) {
            print " $attr_value: ", head($attr_value) ? "OK" : "BAD", "\n";
        }
    }
}
#----------------------------- |
#% churl http://www.wizards.com |
#http://www.wizards.com: |
# |
# FrontPage/FP_Color.gif: OK |
# |
# FrontPage/FP_BW.gif: BAD |
# |
# #FP_Map: OK |
# |
# Games_Library/Welcome.html: OK |
#----------------------------- |
# by: (posted 2017-09-18 17:48:43) upvotes (0) | downvotes (0) reply
# ??
# reply to comment