4 |
use strict; |
use strict; |
5 |
|
|
6 |
use WWW::Mechanize; |
use WWW::Mechanize; |
7 |
|
use MARC::Record; |
8 |
|
|
9 |
|
binmode STDOUT, ':utf8'; |
10 |
|
|
11 |
|
my $cobiss_marc21 = { |
12 |
|
'010' => { a => [ '020', 'a' ] }, |
13 |
|
200 => { |
14 |
|
a => [ 245 , 'a' ], |
15 |
|
f => [ 245 , 'f' ], |
16 |
|
}, |
17 |
|
205 => { a => [ 250 , 'a' ] }, |
18 |
|
210 => { |
19 |
|
a => [ 250 , 'a' ], |
20 |
|
c => [ 260 , 'b' ], |
21 |
|
d => [ 260 , 'c' ], |
22 |
|
}, |
23 |
|
215 => { |
24 |
|
a => [ 300 , 'a' ], |
25 |
|
c => [ 300 , 'b' ], |
26 |
|
d => [ 300 , 'c' ], |
27 |
|
}, |
28 |
|
700 => { |
29 |
|
a => [ 100 , 'a' ], |
30 |
|
}, |
31 |
|
}; |
32 |
|
|
33 |
sub search { |
sub search { |
34 |
|
|
71 |
if ( $mech->content =~ m{<pre>\s*(.+1\..+?)\s*</pre>}s ) { |
if ( $mech->content =~ m{<pre>\s*(.+1\..+?)\s*</pre>}s ) { |
72 |
my $comarc = $1; |
my $comarc = $1; |
73 |
$comarc =~ s{</?b>}{}gs; |
$comarc =~ s{</?b>}{}gs; |
74 |
$comarc =~ s{<(/?font)[^>]*>}{<sf>}gs; |
$comarc =~ s{<font[^>]*>}{<s>}gs; |
75 |
|
$comarc =~ s{</font>}{<e>}gs; |
76 |
|
|
77 |
print $comarc; |
print $comarc; |
78 |
|
|
79 |
|
my $marc = MARC::Record->new; |
80 |
|
|
81 |
|
foreach my $line ( split(/[\r\n]+/, $comarc) ) { |
82 |
|
our @f; |
83 |
|
|
84 |
|
if ( $line !~ s{(\d\d\d)([01 ])([01 ])}{} ) { |
85 |
|
warn "SKIP: $line\n"; |
86 |
|
} else { |
87 |
|
$line .= "<eol>"; |
88 |
|
|
89 |
|
@f = ( $1, $2, $3 ); |
90 |
|
sub sf { warn "sf",@_,"|",@f; push @f, @_; } |
91 |
|
$line =~ s{<s>(\w)<e>([^<]+)\s*}{sf($1, $2)}ges; |
92 |
|
warn "# f:", join(' ', @f), " left:|$line|\n"; |
93 |
|
$marc->add_fields( @f ); |
94 |
|
} |
95 |
|
} |
96 |
|
|
97 |
|
open(my $out, '>:utf8', 'out.marc'); |
98 |
|
print $out $marc->as_usmarc; |
99 |
|
close($out); |
100 |
|
|
101 |
|
warn $marc->as_formatted; |
102 |
|
|
103 |
return $comarc; |
return $comarc; |
104 |
} else { |
} else { |
105 |
die "can't fetch COMARC format from ", $mech->content; |
die "can't fetch COMARC format from ", $mech->content; |