#!/usr/bin/perl
# GETTER.PL
#
# Reads web-server access-log lines from STDIN and, for every request that
# did not return status 200, fetches the requested path from another website
# with wget. Used when cloning a website that cannot be fully retrieved via
# wget alone, such as Flash websites.
#
# Sample logfile format:
#   68.85.201.140 - - [14/Nov/2005:10:58:34 -0500] "GET /staff.swf HTTP/1.1" 404
#
# - By Mike of GeekLabs.com  mikeh@geeklabs.com
#   ego-ware, like it? Send me a thank you!
#----------
# Run this by piping the live access log into the script, e.g.
#   tail -f logfile | perl getter.pl
# and then go surf the website that you grabbed with wget but that is
# missing pieces because of weird links in Flash or JavaScript.

use strict;
use warnings;

# Base URL of the original site; edit this before running.
my $source = "http://www.originalwebsite.???";

# Read log lines from STDIN. An empty "while()" condition is always true in
# Perl and never reads any input, so the read has to be spelled out.
while (my $line = <STDIN>) {
    # Whitespace-split fields of the log line shown above:
    # index 6 is the request path, index 8 is the HTTP status code.
    my @fields = split /\s+/, $line;
    my ($path, $status) = @fields[6, 8];

    # Skip blank or malformed lines rather than fetching the bare site root.
    next unless defined $path && defined $status;

    print "$path - $status\n";

    # The file was served fine; nothing to fetch.
    next if $status eq "200";

    # NOTE: any status other than 200 (not only 404) triggers a fetch.
    my $url = "$source$path";
    print "wget -nH $url\n";

    # List-form system() bypasses the shell, so metacharacters in a logged
    # request path (";", "&", backticks, ...) cannot inject commands.
    system('wget', '-nH', $url) == 0
        or warn "wget failed for $url (wait status $?)\n";
}