projects
/
migration-tools.git
/ commitdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
| commitdiff |
tree
raw
|
patch
(parent:
e64cecf
)
compress: more reporting
author
Shawn Boyette
<sboyette@esilibrary.com>
Mon, 8 Dec 2008 22:27:53 +0000 (22:27 +0000)
committer
Shawn Boyette
<sboyette@esilibrary.com>
Mon, 8 Dec 2008 22:27:53 +0000 (22:27 +0000)
compress_fingerprints
patch
|
blob
|
history
diff --git
a/compress_fingerprints
b/compress_fingerprints
index
44abf94
..
377a517
100755
(executable)
--- a/
compress_fingerprints
+++ b/
compress_fingerprints
@@
-15,13
+15,17
@@
my %recs = (); # fingerprints belonging to each record
open FP, '<', $ARGV[0] or die "Can't open input file: $!\n";
my $count = 0;
+my $i = 0; # input lines handled so far; drives the progress display
my $total = `wc -l $ARGV[0]`;
+$| = 1; # autoflush output so the "\r" progress line repaints as it is printed
print "Loading and ranking fingerprints\n";
while (<FP>) {
my @fields = split "\t", $_;
my $fp = populate_fingerprint(@fields);
rank_fingerprint($fp);
+ $i++;
+ print "\r", ( int(100 * $i / $total) ), "% complete" unless ($i % 1000); # scale the 0..1 ratio to a percentage before truncating; refreshed every 1000 lines
}
print "$total fingerprints processed\n";
print "$count records set as leads\n";