pricecharts

track prices of consumer electronics
Log | Files | Refs | README

commit 440364db6fb93516c5dc4ea4c3126a0d9da472c3
parent dca4c452e2326021886fae47ee2cdf3b4ced8d70
Author: Kyle Milz <kyle@getaddrinfo.net>
Date:   Sun, 12 Oct 2014 23:01:54 -0600

product_scraper: change accounting of new products

Diffstat:
M product_scraper.pl | 13 +++++++------
1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/product_scraper.pl b/product_scraper.pl
@@ -43,13 +43,13 @@ my %product_map = ("televisions" => "Televisions",
 my $email;
 $email .= "*** Memory Express ***\n\n";
-$email .= "product type scraped total new\n";
+$email .= "type scraped total new\n";
 $email .= "------------ ------- ----- ---\n";
 my @new = ();
 for (keys %product_map) {
-    $email .= sprintf("%-15s ", "$_:");
+    $email .= sprintf("%-15s ", $_);
     my $class_url = "http://www.memoryexpress.com/Category/" .
         "$product_map{$_}?PageSize=120&Page=";
@@ -74,7 +74,8 @@ for (keys %product_map) {
         push @results, $dom->find(".PIV_Regular")->html_array();
     }
-    my $scraped = 0;
+    my $new = 0;
+    my $old = 0;
     for my $node (@results) {
         my $product = HTML::Grabber->new(html => $node);
@@ -110,6 +111,7 @@ for (keys %product_map) {
             $dbh->do("update products set last_seen = ? where part_num = ?",
                 undef, time, $part_num);
             # also update title, brand here?
+            $old++;
         }
         else {
             $dbh->do("insert into products(part_num, brand, title," .
@@ -119,14 +121,13 @@ for (keys %product_map) {
             #$dbh->do("create table [$part_num]" .
             # "(unix_time int not null primary key)");
             push @new, ([$_, $brand, $title, $part_num]);
+            $new++;
         }
-        $scraped++;
         last;
     }
-    $email .= sprintf("%7s %5s %3s\n", $scraped, scalar @results,
-        scalar @new);
+    $email .= sprintf("%7s %5s %3s\n", $new + $old, scalar @results, $new);
     next;
 }