-
Notifications
You must be signed in to change notification settings - Fork 0
/
grabFeedback.pl
77 lines (56 loc) · 1.69 KB
/
grabFeedback.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
#!/usr/bin/perl -w
# Example code from Chapter 1 of /Perl and LWP/ by Sean M. Burke
# http://www.oreilly.com/catalog/perllwp/
#require 5;
use strict;
use warnings;
use LWP::Simple;

# grabFeedback.pl StateFolder
#
# Walks the folders StateFolder/ratings/A .. StateFolder/ratings/Z, reads
# every *.htm file found there and looks for "Read this rating's feedback"
# links.  Each linked page is downloaded from www.ratemds.com and stored as
# StateFolder/ratings/feedback/feedback<id>.htm, where <id> is the node
# number taken from the link.  Pages that already exist on disk are skipped,
# so the script can be re-run to pick up where it left off.
#
# Exit status: 3 when a feedback link has no recognizable node id; dies if
# an output file cannot be written.

if (scalar(@ARGV) != 1) {
    print "Usage: grabFeedback.pl StateFolder\n";
    exit;
}
my $stateFolder = $ARGV[0];

for my $letter ('A' .. 'Z') {
    my $foldername = "$stateFolder/ratings/$letter";

    # Read all files in folder.  A missing or unreadable letter folder is
    # reported and skipped rather than read through a closed handle.
    my $dir;
    if (!opendir($dir, $foldername)) {
        warn "Cannot read folder $foldername: $!\n";
        next;
    }
    my @files = grep(/\.htm$/, readdir($dir));
    closedir($dir);

    foreach my $filename (@files) {
        #print "Checking file $foldername/$filename\n";
        my $in;
        if (!open($in, '<', "$foldername/$filename")) {
            warn "Cannot open file $foldername/$filename: $!\n";
            next;
        }
        my @lines = <$in>;
        close($in);

        # Scan every line of the file and fetch each feedback page it links to.
        foreach my $line (@lines) {
            next unless $line =~ m/href="\/(social[^" ]*).*Read this rating's feedback/;
            my $originalURL = $1;

            my $id;
            if ($originalURL =~ m/social\/\?q=node\/(\d+)/) {
                $id = $1;
            } else {
                print "DISASTER id-processing $originalURL";
                exit(3);
            }

            my $outfilename = "$stateFolder/ratings/feedback/feedback$id.htm";
            if (-e $outfilename) {
                print "Skipped $outfilename\n";
                next;
            }

            my $myUrl   = "http://www.ratemds.com/$originalURL";
            my $content = get($myUrl);

            if (defined $content) {
                # Only create the output file once there is something to put
                # in it: an empty file left by a failed download would be
                # treated as "already fetched" on every later run.
                open(my $out, '>', $outfilename)
                    or die "Cannot open file $outfilename: $!";
                print {$out} $content;
                print "Wrote $myUrl to $outfilename\n";
                if (!close($out)) {
                    my $err = $!;
                    # Remove the possibly truncated file so it is retried.
                    unlink $outfilename;
                    die "Cannot close file $outfilename: $err";
                }
            } else {
                warn "Failed to download $myUrl; no file written\n";
            }

            # Pause after every request, successful or not, to go easy on
            # the remote server.
            sleep 10;
        }
    }
    #sleep 5;
}
print "done! Ta Da \n";
__END__