28 |
print S $common::mps_header; |
print S $common::mps_header; |
29 |
print MPS $common::mps_header; |
print MPS $common::mps_header; |
30 |
|
|
31 |
|
#-------------------------------------------------------------------- |
32 |
|
# Build the %in_mps_header lookup used by the configuration checks made
# later in this file.  Only lines of $common::mps_header that start with
# "F " are considered; each is split on single spaces and the third field
# becomes the key, the second field the value.
my %in_mps_header;
for my $header_line (split(/\n/, $common::mps_header)) {
    next unless ($header_line =~ /^F /);
    # fields: "F", isis id, mps id, rest of the line (ignored)
    my (undef, $isis_id, $mps_id) = split(/ /, $header_line, 4);
    $in_mps_header{$mps_id} = $isis_id;
}
41 |
|
require "./search/config.pm"; |
42 |
|
|
43 |
|
#-------------------------------------------------------------------- |
44 |
|
# Read the database configuration file named by $common::database_cf and
# store the database descriptions by database name.
#
# Only lines of the form "database-name:<name>=<description>" are used.
# A leading "##word##" marker is stripped from the description before it
# is stored in %DatabaseDescriptions.  Dies with the file name and the
# system error if the file cannot be opened.
my %DatabaseDescriptions;
{
    # Three-argument open with an explicit read mode: the configured path
    # is always treated as a plain file name, never as a mode or a pipe.
    open(my $cf, '<', $common::database_cf) || die "$common::database_cf: $!";
    # A named line variable keeps the global $_ untouched.
    while (my $line = <$cf>) {
        chomp $line;
        next unless ($line =~ /^database-name:([^=]+)=(.*)$/);
        my ($db_name, $db_desc) = ($1, $2);
        # The pattern is anchored at the start, so it can match only once.
        $db_desc =~ s/^##\w+##//;
        $DatabaseDescriptions{$db_name} = $db_desc;
    }
    close($cf);
}
56 |
|
|
57 |
|
#-------------------------------------------------------------------- |
58 |
# |
# |
59 |
# expand(nr,"space separated string"); |
# expand(nr,"space separated string"); |
60 |
# |
# |
61 |
|
|
62 |
sub expand { |
sub expand { |
63 |
my $nr = shift @_; |
my $nr = shift @_; |
64 |
|
die "$nr is not in mps_header" if (!$in_mps_header{$nr}); |
65 |
my $out = ""; |
my $out = ""; |
66 |
while (my $fld = c_852_iso(shift @_)) { |
while (my $fld = c_852_iso(shift @_)) { |
67 |
my @words=split(/\s+/,$fld); |
my @words=split(/\s+/,$fld); |
78 |
|
|
79 |
#-------------------------------------------------------------------- |
#-------------------------------------------------------------------- |
80 |
|
|
|
################### ERASE###############3 |
|
|
|
|
|
# expand sub-fileds from ISIS field |
|
|
# (^a.....^b....) |
|
|
my %data; # FIX |
|
|
sub ex_sf { |
|
|
%data = (); |
|
|
my $in = $_[0]; |
|
|
if (my $tmp = $in) { |
|
|
# $tmp =~ tr/џ/ƾ/; # ISIS -> iso-8859-2 |
|
|
$tmp =~ tr//ܫꔼȺ̪㍐슂ٝ/; |
|
|
if ($in =~ m/^\^/) { |
|
|
my @sub = split(/\^/,$in); |
|
|
foreach my $fld (@sub) { |
|
|
$data{$1} = $2 if ($fld =~ m/^(\w+)(.+)$/) |
|
|
} |
|
|
} else { |
|
|
$data{all} = $in."<-- iz polja bez podpolja"; |
|
|
} |
|
|
} |
|
|
} |
|
|
|
|
|
# dump all sub-fields |
|
|
sub all_sf { |
|
|
my $nr = shift @_; |
|
|
my $out=""; |
|
|
foreach my $k (sort keys %data) { |
|
|
$out.=expand($nr,$data{$k}); |
|
|
} |
|
|
return $out; |
|
|
} |
|
|
|
|
|
sub all_sf_r { |
|
|
my $nr = shift @_; |
|
|
my $out=""; |
|
|
foreach my $k (sort {$b cmp $a} keys %data) { |
|
|
$out.=expand($nr,$data{$k}); |
|
|
} |
|
|
return $out; |
|
|
} |
|
|
|
|
|
sub all_sf2bib { |
|
|
my $nr = shift @_; |
|
|
my $max_in_line=shift @_ || 0; |
|
|
my $sep = shift @_ || ' '; |
|
|
my $out; |
|
|
my $i=0; |
|
|
my $bib = ""; |
|
|
foreach my $k (sort keys %data) { |
|
|
if ($out) { |
|
|
$out.= $sep.$data{$k}; |
|
|
} else { |
|
|
$out = $data{$k}; |
|
|
} |
|
|
$i++; |
|
|
if ($i == $max_in_line) { |
|
|
$bib .= $nr." ".$out."\n" if ($out); |
|
|
$i=0; |
|
|
$out=""; |
|
|
} |
|
|
} |
|
|
$bib .= $nr." ".$out."\n" if ($out); |
|
|
return $bib; |
|
|
} |
|
|
|
|
|
sub all_sf2bib_r { |
|
|
my $nr = shift @_; |
|
|
my $max_in_line=shift @_ || 0; |
|
|
my $sep = shift @_ || ' '; |
|
|
my $out; |
|
|
my $i=0; |
|
|
my $bib = ""; |
|
|
foreach my $k (sort {$b cmp $a} keys %data) { |
|
|
if ($out) { |
|
|
$out.= $sep.$data{$k}; |
|
|
} else { |
|
|
$out = $data{$k}; |
|
|
} |
|
|
$i++; |
|
|
if ($i == $max_in_line) { |
|
|
$bib .= $nr." ".$out."\n" if ($out); |
|
|
$i=0; |
|
|
$out=""; |
|
|
} |
|
|
} |
|
|
$bib .= $nr." ".$out."\n" if ($out); |
|
|
return $bib; |
|
|
} |
|
|
|
|
|
#-------------------------------------------------------------------- |
|
|
|
|
81 |
sub c_852_iso { |
sub c_852_iso { |
82 |
my $tmp = $_[0]; |
my $tmp = $_[0]; |
83 |
$tmp =~ tr//ܫꔼȺ̪㍐슂ٝ/ if ($tmp); |
$tmp =~ tr//ܫꔼȺ̪㍐슂ٝ/ if ($tmp); |
94 |
|
|
95 |
#-------------------------------------------------------------------- |
#-------------------------------------------------------------------- |
96 |
|
|
97 |
# $mps .= sf_to_mps($subfiled_hash,"subfields",mps_id); |
# $mps .= sf_to_mps("subfields",$subfiled_hash) |
98 |
# |
# |
99 |
# subfields options: |
# subfields options: |
100 |
# * - all (no sort) |
# * - all (no sort) |
125 |
|
|
126 |
sub sf_to_mps { |
sub sf_to_mps { |
127 |
my ($sf_hash,$subfields,$mps_id) = @_; |
my ($sf_hash,$subfields,$mps_id) = @_; |
128 |
|
die "$mps_id is not in mps_header" if (!$in_mps_header{$mps_id}); |
129 |
my $out=""; |
my $out=""; |
130 |
my @sf_arr = subfields_str_2_arr($subfields,$sf_hash); |
my @sf_arr = subfields_str_2_arr($subfields,$sf_hash); |
131 |
|
|
145 |
my $mps_id = shift @_ || die; |
my $mps_id = shift @_ || die; |
146 |
my $subfields = shift @_; |
my $subfields = shift @_; |
147 |
|
|
148 |
|
die "$mps_id is not in mps_header" if (!$in_mps_header{$mps_id}); |
149 |
|
|
150 |
my $i=0; |
my $i=0; |
151 |
my $out = ""; |
my $out = ""; |
152 |
|
|
190 |
my $group_sort = shift @_ || ''; |
my $group_sort = shift @_ || ''; |
191 |
my $sep = shift @_ || ' '; |
my $sep = shift @_ || ' '; |
192 |
|
|
193 |
|
my $fld = $bib_id; $fld =~ s/^%//; |
194 |
|
die "$fld is not in FieldNames" if (!$default::FieldNames{$fld}); |
195 |
|
|
196 |
my $i=0; |
my $i=0; |
197 |
|
|
198 |
my $bib=""; |
my $bib=""; |
285 |
} |
} |
286 |
|
|
287 |
#-------------------------------------------------------------------- |
#-------------------------------------------------------------------- |
|
#-------------------------------------------------------------------- |
|
|
|
|
288 |
|
|
289 |
my $last_tell=0; |
my $last_tell=0; |
290 |
|
|
329 |
} |
} |
330 |
|
|
331 |
my $headline; |
my $headline; |
332 |
$headline .= isis_sf($row,'200','a',"'"); |
$headline .= isis_sf($row,'200','a'); |
333 |
$headline .= isis_sf($row,'200','e'," : ","'"); |
$headline .= isis_sf($row,'200','e'," : "); |
334 |
|
$headline .= isis_sf($row,'200','f'," / "); |
335 |
|
$headline .= isis_sf($row,'210','d'," , "); |
336 |
|
|
337 |
# author |
# author |
338 |
$bib .= isis_to_bib($row,'700','%700+','*',2,'<'); |
$bib .= isis_to_bib($row,'700','%700+','*',2,'<'); |
363 |
$book .= ". ".$sf->{c} if ($sf->{c}); |
$book .= ". ".$sf->{c} if ($sf->{c}); |
364 |
$book .= " / ".$sf->{x} if ($sf->{x}); |
$book .= " / ".$sf->{x} if ($sf->{x}); |
365 |
$book .= " ; ".$sf->{y} if ($sf->{y}); |
$book .= " ; ".$sf->{y} if ($sf->{y}); |
366 |
$bib .= "%200 $book\n" if ($book); |
$bib .= "%200+ $book\n" if ($book); |
367 |
|
|
368 |
$mps .= isis_to_mps($row,'200',2,"akcde"); |
$mps .= isis_to_mps($row,'200',2,"akcde"); |
369 |
$mps .= isis_to_mps($row,'532',2); |
$mps .= isis_to_mps($row,'532',2); |
375 |
$mps .= isis_to_mps($row,'233',2,"ae"); |
$mps .= isis_to_mps($row,'233',2,"ae"); |
376 |
|
|
377 |
|
|
378 |
$bib .= "%sv ".isis_sf($row,'230','v'). |
my $tmp; |
379 |
|
$tmp = isis_sf($row,'230','v'). |
380 |
isis_sf($row,'230','a',' : '). |
isis_sf($row,'230','a',' : '). |
381 |
isis_sf($row,'250',undef,'. - '). |
isis_sf($row,'250',undef,'. - '). |
382 |
isis_sf($row,'260',undef,'. - '). |
isis_sf($row,'260',undef,'. - '). |
383 |
isis_sf($row,'290',undef,'<br>ISBN '). |
isis_sf($row,'290',undef,'<br>ISBN '); |
384 |
"\n"; |
$bib .= "%sv $tmp\n" if ($tmp); |
385 |
$bib .= "%sv ".isis_sf($row,'231','v','<br>'). |
|
386 |
|
$tmp = isis_sf($row,'231','v','<br>'). |
387 |
isis_sf($row,'231','a',' : '). |
isis_sf($row,'231','a',' : '). |
388 |
isis_sf($row,'251',undef,'. - '). |
isis_sf($row,'251',undef,'. - '). |
389 |
isis_sf($row,'261',undef,'. - '). |
isis_sf($row,'261',undef,'. - '). |
390 |
isis_sf($row,'291',undef,'<br>ISBN '). |
isis_sf($row,'291',undef,'<br>ISBN '); |
391 |
"\n"; |
$bib .= "%sv $tmp\n" if ($tmp); |
392 |
$bib .= "%sv ".isis_sf($row,'232','v','<br>'). |
|
393 |
|
$tmp = isis_sf($row,'232','v','<br>'). |
394 |
isis_sf($row,'232','a',' : '). |
isis_sf($row,'232','a',' : '). |
395 |
isis_sf($row,'252',undef,'. - '). |
isis_sf($row,'252',undef,'. - '). |
396 |
isis_sf($row,'262',undef,'. - '). |
isis_sf($row,'262',undef,'. - '). |
397 |
isis_sf($row,'292',undef,'<br>ISBN '). |
isis_sf($row,'292',undef,'<br>ISBN '); |
398 |
"\n"; |
$bib .= "%sv $tmp\n" if ($tmp); |
399 |
$bib .= "%sv ".isis_sf($row,'233','v','<br>'). |
|
400 |
|
$tmp = isis_sf($row,'233','v','<br>'). |
401 |
isis_sf($row,'233','a',' : '). |
isis_sf($row,'233','a',' : '). |
402 |
isis_sf($row,'253',undef,'. - '). |
isis_sf($row,'253',undef,'. - '). |
403 |
isis_sf($row,'263',undef,'. - '). |
isis_sf($row,'263',undef,'. - '). |
404 |
isis_sf($row,'293',undef,'<br>ISBN '). |
isis_sf($row,'293',undef,'<br>ISBN '); |
|
"\n"; |
|
405 |
|
|
406 |
$mps .= isis_to_mps($row,'270',2); |
$mps .= isis_to_mps($row,'270',2); |
407 |
$mps .= isis_to_mps($row,'271',2); |
$mps .= isis_to_mps($row,'271',2); |
408 |
$mps .= isis_to_mps($row,'272',2); |
$mps .= isis_to_mps($row,'272',2); |
409 |
$mps .= isis_to_mps($row,'273',2); |
$mps .= isis_to_mps($row,'273',2); |
410 |
|
|
|
$headline .= isis_sf($row,'700','b'," "); |
|
|
$headline .= isis_sf($row,'700','a'," "); |
|
|
|
|
411 |
# izdavac |
# izdavac |
412 |
$mps .= isis_to_mps($row,'210',3); |
$mps .= isis_to_mps($row,'210',3); |
413 |
$mps .= isis_to_mps($row,'250',3); |
$mps .= isis_to_mps($row,'250',3); |
427 |
$year =~ s/^\s*cop\.*\s*//i; |
$year =~ s/^\s*cop\.*\s*//i; |
428 |
$year =~ s/[\[\]]*//g; |
$year =~ s/[\[\]]*//g; |
429 |
$mps .= "D ${year}\n" if ($year !~ m/\?/ && $year =~ /\d{4}/); |
$mps .= "D ${year}\n" if ($year !~ m/\?/ && $year =~ /\d{4}/); |
|
$headline .= " ($year)"; |
|
430 |
} |
} |
431 |
|
|
432 |
$mps .= isis_to_mps($row,'215',15); |
$mps .= isis_to_mps($row,'215',15); |
471 |
$bib .= isis_to_bib($row,'991','%991'); |
$bib .= isis_to_bib($row,'991','%991'); |
472 |
$mps .= isis_to_mps($row,'991',12); |
$mps .= isis_to_mps($row,'991',12); |
473 |
|
|
474 |
sub store_isn { |
sub isis_isn_to_mps { |
475 |
if (my $isn = shift @_) { |
my $row = shift @_ || die; |
476 |
my $nr = shift @_; |
my $isis_id = shift @_ || die; |
477 |
my $tag = shift @_; |
my $nr = shift @_ || die; |
478 |
|
my $i=0; |
479 |
|
my $mps=''; |
480 |
|
while (my $isn=$row->{$isis_id}->[$i]) { |
481 |
$isn =~ s/ +//g; # remove spaces |
$isn =~ s/ +//g; # remove spaces |
482 |
$mps .= "W $isn $nr\n"; |
$mps .= "W $isn $nr\n"; |
|
$bib .= "$tag $isn\n"; |
|
483 |
if ($isn =~ s/-//g) { |
if ($isn =~ s/-//g) { |
484 |
$mps .= "W $isn $nr\n"; |
$mps .= "W $isn $nr\n"; |
485 |
} |
} |
486 |
|
$i++; |
487 |
} |
} |
488 |
|
return $mps; |
489 |
} |
} |
490 |
|
|
491 |
# ISBN |
# ISBN |
492 |
store_isn($row->{10}->[0],13,'%ISBN'); |
$bib .= isis_to_bib($row,'10','%ISBN'); |
493 |
$mps .= isis_to_mps($row,'290',13); |
$mps .= isis_isn_to_mps($row,'10',13); |
494 |
$mps .= isis_to_mps($row,'291',13); |
$mps .= isis_isn_to_mps($row,'290',13); |
495 |
$mps .= isis_to_mps($row,'292',13); |
$mps .= isis_isn_to_mps($row,'291',13); |
496 |
$mps .= isis_to_mps($row,'293',13); |
$mps .= isis_isn_to_mps($row,'292',13); |
497 |
|
$mps .= isis_isn_to_mps($row,'293',13); |
498 |
|
|
499 |
# ISSN |
# ISSN |
500 |
#store_isn($row->{11}->[0],14,'%ISSN'); |
#store_isn($row->{11}->[0],14,'%ISSN'); |
505 |
|
|
506 |
# headline |
# headline |
507 |
if ($headline) { |
if ($headline) { |
508 |
$headline .= " [".$row->{mfn}."]"; ## debug MFN! |
$headline .= " <i>(".$DatabaseDescriptions{$db_dir}.", ".$row->{mfn}.")</i>"; ## debug MFN! |
509 |
|
$headline =~ s/&/∧/g; |
510 |
|
$headline =~ s/</</g; |
511 |
|
$headline =~ s/>/>/g; |
512 |
|
$headline =~ s/<(\/?[bi])>/<$1>/g; |
513 |
$mps .= "H ".c_852_iso($headline)."\n"; |
$mps .= "H ".c_852_iso($headline)."\n"; |
514 |
} else { |
} else { |
515 |
$mps .= "H nepoznato\n"; |
$mps .= "H nepoznato\n"; |
524 |
#} |
#} |
525 |
|
|
526 |
print R c_852_iso($bib); |
print R c_852_iso($bib); |
527 |
print R "%perl ".Dumper($row)."\n"; |
|
528 |
|
# check if all fields are defined |
529 |
|
foreach (split(/\n/,$bib)) { |
530 |
|
if (/^%(\w+)\s/ && !$default::FieldNames{$1}) { |
531 |
|
die "field $1 used but not in FieldNames"; |
532 |
|
} |
533 |
|
} |
534 |
|
|
535 |
|
# print R "%perl ".Dumper($row)."\n"; |
536 |
|
|
537 |
$mps .= "T document text/plain ".(tell(R) - $last_tell)." $dir/bib $last_tell ".tell(R)."\n"; |
$mps .= "T document text/plain ".(tell(R) - $last_tell)." $dir/bib $last_tell ".tell(R)."\n"; |
538 |
$last_tell=tell(R); |
$last_tell=tell(R); |