#!/usr/bin/perl

use LWP::Simple;

# sat3310 - lab05
# created by grgindin@mtu.edu
# 3/10/2026

# Purpose: download a tab-separated list of companies, issue an HTTP HEAD
# request to each company's website, and report how many sites run each
# kind of web server (taken from the "Server" response header).

# Enabled here rather than at the top of the file so that this section is
# self-contained; both pragmas apply from this point to the end of the file.
use strict;
use warnings;

# Variables
# Remote directory and file name of the data set, and the local directory
# the downloaded copy is written to.
my $dataurl   = "http://pages.mtu.edu/~toarney/sat3310/lab07/";
my $datafile  = "fortune500.tsv";
my $datapath  = "/home/greg/Documents/sat3310/lab05/data/";
my $localfile = $datapath . $datafile;

# Main

# Get a file - list of websites
# getstore() returns the HTTP status code.  A failed download is only a
# warning so that a previously stored copy of the file can still be used;
# if there is no such copy, the open() below stops the script.
my $status = getstore($dataurl . $datafile, $localfile);
if (!is_success($status)) {
    warn "Download of $dataurl$datafile failed (HTTP status $status); "
       . "trying an existing copy of $localfile\n";
}

# Parse websites file
# The website is read from the third tab-separated column of every line
# except the first (presumably a header row -- confirm against the data).
open(my $fh, "<", $localfile) or die "Cannot open $localfile: $!\n";
my @arrayofurls;
while (my $line = <$fh>) {
    next if $. == 1;                 # skip the first line of the file
    $line =~ s/\r?\n\z//;            # drop the line ending (LF or CRLF)
    my @fields = split /\t/, $line;
    # Blank or short lines have no third column; there is nothing to query.
    next if !defined $fields[2] || $fields[2] eq "";
    push @arrayofurls, $fields[2];
}
close $fh;

# Unbuffered output so the progress line is shown as it is updated.
$| = 1;

my $totalsize = scalar @arrayofurls;
my $working   = 0;
my @arrayofservertypes;

# Start the loop
foreach my $website (@arrayofurls) {
    # Only add a scheme when the entry does not already carry one.
    my $completeurl = $website =~ m{\A https?:// }xi
                    ? $website
                    : "http://" . $website;

    # head() returns (type, length, modified, expires, server) on success
    # and an empty list on failure, which leaves $servertype undefined.
    my (undef, undef, undef, undef, $servertype) = head($completeurl);
    if (!defined $servertype || $servertype eq "") {
        $servertype = "Unknown";
    }

    # Keep only the product name, e.g. "Apache/2.4.1 (Unix)" -> "Apache".
    # A leading "/" (position 0) is not treated as a separator.
    my $slash = index($servertype, "/");
    my $servertypesubstring = $slash > 0
                            ? substr($servertype, 0, $slash)
                            : $servertype;
    push @arrayofservertypes, $servertypesubstring;

    # "\r" returns to the start of the line so each update overwrites the
    # previous one, whatever its length.
    $working++;
    print "\rWorking... $working of $totalsize done.";
}
print "\n";

# Count results
# servertype hash (key, value)
# keys are server type names, values are number of times seen
my %servertypehash;
$servertypehash{$_}++ for @arrayofservertypes;

# Sort and print results
# Most frequently seen server type first; ties are ordered by name.
foreach my $servername (
    sort { $servertypehash{$b} <=> $servertypehash{$a} || $a cmp $b }
    keys %servertypehash
) {
    print "Hash: $servername\t $servertypehash{$servername} \n";
}

