#!/usr/bin/perl
use strict;
use warnings;

# Builds a sorted, de-duplicated list of Aquatrols MSDS / label links.
#
# Reads both.html, keeps every line that mentions "MSDS" or "LABEL",
# rewrites the link on that line (see _rewrite_link_line), writes the
# result to list1.html and finally sorts it uniquely into list.html.
#
# both.html is expected to exist already.  It was originally produced by
# the commands below, which are kept (disabled) for reference:
##system "wget -O green.html \"http://www.aquatrols.com/tech%20pgs/GH&Nsy%20labels%20&%20MSDSes.htm\"";
##system "wget -O turf.html \"http://www.aquatrols.com/tech%20pgs/turf%20labels%20&%20MSDSes_.htm\"";
##system "cat green.html turf.html > both.html";

my $INPUT_FILE    = 'both.html';
my $UNSORTED_FILE = 'list1.html';
my $SORTED_FILE   = 'list.html';

# Prefix inserted after href=" so the link target becomes an absolute URL.
my $BASE_URL = 'http://www.aquatrols.com/tech%20pgs/';

# Rewrite one input line, or return nothing if the line mentions neither
# "MSDS" nor "LABEL".
#
#   $line - one raw line of input, including its trailing newline.
#
# Returns the rewritten line (trailing newline preserved), or an empty
# list / undef when the line is not of interest.
sub _rewrite_link_line {
    my ($line) = @_;

    return unless $line =~ /MSDS|LABEL/;

    # Trim leading spaces and the spaces just before the line end.
    $line =~ s/^ *//;
    $line =~ s/ *$//;

    # Only the first href on the line is rewritten.
    $line =~ s{href="}{href="$BASE_URL};

    # Tag the text in front of the first closing tag with the document kind.
    $line =~ s{</}{-MSDS</}  if $line =~ /MSDS/;
    $line =~ s{</}{-Label</} if $line =~ /LABEL/;

    # Prefix the text after the first '>' with the vendor name.
    $line =~ s/>/>Aquatrols -/;

    return $line;
}

open my $in, '<', $INPUT_FILE
    or die "Cannot open $INPUT_FILE for reading: $!\n";
open my $out, '>', $UNSORTED_FILE
    or die "Cannot open $UNSORTED_FILE for writing: $!\n";

while (my $line = <$in>) {
    my $rewritten = _rewrite_link_line($line);
    next unless defined $rewritten;
    print {$out} $rewritten
        or die "Cannot write to $UNSORTED_FILE: $!\n";
}

close $in;

# Close before sorting so buffered output is on disk and write errors
# are reported instead of silently producing a short list.
close $out
    or die "Cannot close $UNSORTED_FILE: $!\n";

# List form avoids the shell; "-o FILE" is the equivalent of "> FILE".
system('sort', '-u', '-o', $SORTED_FILE, $UNSORTED_FILE) == 0
    or die "sort of $UNSORTED_FILE failed (wait status $?)\n";