## $Id: StorageInterface.pm,v 1.1 2003/01/20 16:58:46 joko Exp $
##
## Copyright (c) 2002 Andreas Motl <andreas.motl@ilo.de>
##
## See COPYRIGHT section in pod text below for usage and distribution rights.
##
## ----------------------------------------------------------------------------------------
## $Log: StorageInterface.pm,v $
## ----------------------------------------------------------------------------------------


package Data::Transfer::Sync::Compare::Checksum;

use strict;
use warnings;

# this package is mixed into Data::Transfer::Sync
use mixin::with qw( Data::Transfer::Sync );


# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - main

use Data::Dumper;
use Digest::MD5 qw(md5 md5_hex md5_base64);


# get logger instance
# NOTE(review): Log::Dispatch::Config is not loaded anywhere in the visible
# part of this file; presumably the application loads and configures it
# before this module is compiled - confirm against the caller.
my $logger = Log::Dispatch::Config->instance;


# Calculate the checksum of the node stored below $self->{node}->{$descent}
# and store it in that node's "checksum" slot.
#
# Arguments:
#   $descent - key selecting the node below $self->{node}
#   Further arguments (callers may pass a "specifier") are accepted for
#   backward compatibility, but are not used.
#
# The fingerprint is built from the node's "ident", a newline and the
# compact dump of its "payload" as produced by $self->_dumpCompact.
#
# Returns 1 to signal success.
sub _calcChecksum {

    my $self    = shift;
    my $descent = shift;

    # work on the node itself; create it if missing, since the checksum
    # is written back into it below
    my $node = ( $self->{node}->{$descent} ||= {} );

    # a missing ident contributes the empty string to the dump; handle this
    # explicitly to avoid an "uninitialized value" warning
    my $ident = defined $node->{ident} ? $node->{ident} : '';

    # build dump of this node
    my $dump = $ident . "\n" . $self->_dumpCompact( $node->{payload} );

    # TODO: $logger->dump( ... );
    #$logger->debug( __PACKAGE__ . ": " . $dump );

    # calculate checksum from dump
    # note: the 32-bit integer hash from DBI seems to generate duplicates
    #       with small payloads already in ranges of hundreds of items/rows!
    #       try to avoid using it, or use it only for payloads greater than,
    #       let's say, 30 chars (we had about 15 chars average per item/row)

    # md5-based fingerprint, base64 encoded (from Digest::MD5);
    # md5_base64 returns the digest without padding, so "==" is appended
    $node->{checksum} = md5_base64($dump) . '==';

    # 32-bit integer "hash" value (maybe faster?) (from DBI)
    #$node->{checksum} = DBI::hash($dump, 1);

    # signal good
    return 1;

}


# Determine the checksum for the node stored below $self->{node}->{$descent}
# and store it in that node's "checksum" slot.
#
# Arguments:
#   $descent - key selecting the node below $self->{node}
#
# If the storage configured for $descent is flagged "isChecksumAuthority",
# the checksum is calculated via $self->_calcChecksum; otherwise it is read
# from the "cs" property of the node's payload.
#
# Returns nothing (undef / empty list) if there is no node for $descent,
# 1 otherwise.
sub _readChecksum {

    my $self    = shift;
    my $descent = shift;

    # signal checksum bad
    my $node = $self->{node}->{$descent};
    return unless $node;

    # look up the storage options step by step: dereferencing the whole
    # chain at once would create empty hashes inside $self->{options}
    # as a side effect of merely reading it
    my $options = $self->{options};
    my $storage = $options
        && $options->{$descent}
        && $options->{$descent}->{storage};

    # get checksum for current entry
    # TODO: don't have the checksum column/property hardcoded as "cs" here,
    #       make this configurable somehow
    if ( $storage && $storage->{isChecksumAuthority} ) {
        $self->_calcChecksum($descent);
    }
    else {
        # a node without payload yields an undefined checksum; do not
        # create an empty payload in the node just by looking at it
        my $payload = $node->{payload};
        $node->{checksum} = defined $payload ? $payload->{cs} : undef;
    }

    # signal checksum good
    return 1;

}


# a module has to return a true value when it is loaded
1;