# Count the number of characters contained in files.
use File::Find;
use strict;
use warnings;
use File::Temp qw(tempfile);

# Usage: script [DIR ...]
#
# Walks every start directory (default: the current directory) and prints
#   * a table of file-name extensions, most frequent first,
#   * the total number of files seen,
#   * the total and average length of the text of all HTML files.
#
# Each *.htm / *.html file is converted to UTF-8 with the external command
# `nkf -w` and rendered to plain text with `w3m -dump`; the length of that
# rendered text, in bytes, is what gets summed.

main(@ARGV) unless caller;

# Entry point.  Arguments: the list of start directories.
sub main {
    my @start_dirs = @_ ? @_ : ('.');

    # Collect plain entries only.  Directories carry no meaningful
    # extension and must never be handed to nkf.
    my @paths;
    find(sub { push @paths, $File::Find::name unless -d $_ }, @start_dirs);

    my %count_of_type;
    my $all_count   = 0;
    my $html_count  = 0;
    my $html_length = 0;

    for my $path (@paths) {
        if (is_html_path($path)) {
            my $length = html_text_length($path);

            # A file that could not be converted is left out of the HTML
            # statistics so that it does not distort the average.
            if (defined $length) {
                $html_count++;
                $html_length += $length;
            }
        }
        $count_of_type{ file_type_of($path) }++;
        $all_count++;
    }

    # Most frequent type first; ties are broken by name so that the output
    # does not depend on hash ordering.
    my @types = sort {
        $count_of_type{$b} <=> $count_of_type{$a} or $a cmp $b
    } keys %count_of_type;

    # Rank, extension and count are tab-separated so that adjacent fields
    # cannot run into each other (e.g. rank 10 and extension "7z").
    for my $rank (0 .. $#types) {
        print "$rank\t$types[$rank]\t$count_of_type{ $types[$rank] }\n";
    }

    # The labels below are emitted verbatim.  They are presumably Japanese
    # text ("HTML total characters" / "number of files" / "HTML average
    # characters") that depends on the encoding of this source file.
    print "All${all_count}\n";
    print "HtmlÁíʸ»ú¿ôUTF8length${html_length}¥Õ¥¡¥¤¥ë¿ô${html_count}\n";

    # Without any HTML file there is no average; avoid dividing by zero.
    return if $html_count == 0;

    my $average_bytes = $html_length / $html_count;
    print "HTMLÊ¿¶Ñʸ»ú¿ô(UTF8¤Ê¤Î¤Ç3¥Ð¥¤¥È)${average_bytes}\n";

    # Rough character count: the byte average divided by three.
    # NOTE(review): this treats every character as three UTF-8 bytes.
    my $average_chars = $html_length / $html_count / 3;
    print "HTMLÊ¿¶Ñʸ»ú¿ô${average_chars}\n";

    return;
}

# True when the path names an HTML file, i.e. ends in ".htm" or ".html".
sub is_html_path {
    my ($path) = @_;
    return $path =~ /\.html?\z/ ? 1 : 0;
}

# Returns the extension of the last path component (the text after its
# final dot), or the empty string when that component has no extension.
sub file_type_of {
    my ($path) = @_;
    my ($base_name) = $path =~ m{([^/]*)\z};
    return $base_name =~ /\.([^.]+)\z/ ? $1 : '';
}

# Returns the length in bytes of the text that `w3m -dump` renders for the
# given HTML file after `nkf -w` has converted it to UTF-8.  Returns undef
# (after printing a warning) when either command fails.
sub html_text_length {
    my ($path) = @_;

    my $utf8_html = run_and_capture('nkf', '-w', $path);
    return unless defined $utf8_html;

    # The ".html" suffix is there so that w3m treats the temporary file as
    # HTML.  NOTE(review): assumes w3m picks the type from the extension.
    my ($tmp_fh, $tmp_name) = tempfile(SUFFIX => '.html', UNLINK => 1);
    binmode $tmp_fh;
    my $written = print {$tmp_fh} $utf8_html;
    $written = close($tmp_fh) && $written;
    unless ($written) {
        warn "cannot write $tmp_name: $!\n";
        unlink $tmp_name;
        return;
    }

    my $text = run_and_capture('w3m', '-dump', $tmp_name);
    unlink $tmp_name;
    return unless defined $text;

    return length $text;
}

# Runs an external command without going through a shell (so file names
# containing spaces or shell metacharacters are safe) and returns its
# standard output as a byte string.  Returns undef after a warning when
# the command cannot be started or exits with a failure status.
sub run_and_capture {
    my @command = @_;

    my $pid = open my $pipe, '-|', @command;
    unless ($pid) {
        warn "cannot run $command[0]: $!\n";
        return;
    }
    binmode $pipe;

    my $output = do { local $/; <$pipe> };
    $output = '' unless defined $output;

    unless (close $pipe) {
        my $reason = $! ? "$!" : 'exit status ' . ($? >> 8);
        warn "$command[0] failed for $command[-1]: $reason\n";
        return;
    }

    return $output;
}