1 |
|
|
2 |
# Count, per field name, how many records contain that field.
for my $field_name ( keys %$rec ) {
    $out->{fields}{$field_name}++;
}
#$out->{ 'fields +' }->{$_}++ foreach keys %$rec; |
3 |
|
|
4 |
# Count records per year, keyed by the first element of the PY field.
{
    my $first_py = $rec->{PY}->[0];
    $out->{years}{$first_py}++;
}
#$out->{ 'years +' }->{ $rec->{PY}->[0] }++; |
5 |
|
|
6 |
# Count occurrences of every value listed in the record's DT field.
for my $dt_value ( @{ $rec->{DT} } ) {
    $out->{DT}{$dt_value}++;
}
#$out->{ 'DT +' }->{ $_ }++ foreach @{ $rec->{DT} }; |
7 |
|
|
8 |
|
#$out->{'SC +'}->{ $_ }++ foreach @{ $rec->{SC} }; |
9 |
|
|
10 |
|
# FIXME out of memory without Sack::Digest |
11 |
|
#$out->{'C1 +'}->{ $_ }++ foreach @{ $rec->{C1} }; |
12 |
|
#$out->{'C1#+'}->{ $_ }++ foreach @{ $rec->{C1} }; |
13 |
|
|
14 |
|
|
15 |
|
#$out->{'C1_country+'}->{ m{,\s?([^,]+)\.$} && $1 }++ foreach @{ $rec->{C1} }; |
16 |
|
|
17 |
|
# Tally countries found in the record's C1 entries. For each entry, the text
# after the last comma (up to the trailing period) is taken as the country,
# a few variants are normalized, and the upper-cased result is counted
# under $out->{'C1_country+'}.
foreach my $address ( @{ $rec->{C1} } ) {

    # Declare and assign unconditionally. The previous form,
    # "my $country = $1 if m{...}", has undefined behaviour in Perl: when
    # the match failed, the variable could keep the value from the
    # previous iteration and the entry was counted under the wrong country.
    my ($country) = $address =~ m{,\s?([^,]+)\.$};

    # Entries without a parsable country are counted under the empty key.
    $country = '' unless defined $country;

    $country =~ s{^.+USA$}{USA};          # anything ending in "USA"
    $country =~ s{^\w\w\s\d{5}$}{USA};    # two word chars + five digits (presumably state + ZIP)
    $country =~ s{^\w\w$}{USA};           # bare two-character code (presumably a US state)
    # $country =~ s{^([A-Z]+)$}{ucfirst($1)}e;   # disabled in the original
    $country =~ s{^YUGOS.+}{Yugoslavia};  # fold spellings that start with "YUGOS"

    $out->{'C1_country+'}->{ uc $country }++;
}
26 |
|
|
27 |
|
|
28 |
|
#$out->{'CR#+'}->{ $_ }++ foreach @{ $rec->{CR} }; |
29 |
|
|
30 |
|
#$out->{'CR+'}->{ $_ }++ foreach @{ $rec->{CR} }; |
31 |
|
|
32 |
|
#$out->{'CR'}->{ $_ }++ foreach @{ $rec->{CR} }; |
33 |
|
|
34 |
|
#my $cr = 1; |
35 |
|
#my $nr = $out->{_debug}->{nr}++; |
36 |
|
#$out->{'CR +'}->{ "$nr." . $cr++ }++ foreach @{ $rec->{CR} }; |
37 |
|
|
38 |
# XXX dump first record |
# XXX dump first record |
39 |
# Store the current record in the debug slot only while that slot is still
# false, so an already-stored record is never overwritten.
$out->{debug} = $rec unless $out->{debug};
#$out->{_debug_rec} ||= $rec; |
40 |
|
|
41 |
#push @{ $out->{TI} }, $rec->{TI}; |
#push @{ $out->{TI} }, $rec->{TI}; |
42 |
|
|
43 |
|
#push @{ $out->{_debug}->{id} }, $rec->{'000'}; |
44 |
|
|
45 |
|
# Disabled instrumentation: the constant-false guard means none of this runs.
# If enabled it would count records, remember the first timestamp, and
# keep the elapsed seconds since that timestamp up to date.
if (0) {
    if ($rec) {
        $out->{'_debug'}{records}++;
    }
    unless ( $out->{'_debug'}{start_t} ) {
        $out->{'_debug'}{start_t} = time;
    }
    $out->{'_debug'}{duration} = time - $out->{'_debug'}{start_t};
}