/[webpac]/trunk2/all2all.pl
This is a repository of my old source code, which is no longer updated. Go to git.rot13.org for current projects!
ViewVC logotype

Diff of /trunk2/all2all.pl

Parent Directory | Revision Log | View Patch

revision 362 by dpavlin, Wed Jun 16 16:50:30 2004 UTC revision 392 by dpavlin, Wed Jul 21 16:58:27 2004 UTC
# Line 12  use Carp; Line 12  use Carp;
12    
13  use lib './lib';  use lib './lib';
14  use WebPAC;  use WebPAC;
15    use WebPAC::jsFind;
16    
17  my $webpac = new WebPAC(  my $webpac = new WebPAC(
18          code_page => 'ISO-8859-2',          code_page => 'ISO-8859-2',
19          limit_mfn => 500,          limit_mfn => 100,
20    #       debug => 1,
21    ) || die;
22    
23    my $log = $webpac->_get_logger();
24    
25    my $index = new WebPAC::jsFind(
26            index_path => './out/index',
27  ) || die;  ) || die;
28    
29  $|=1;  $|=1;
30    
 print "reading database\n";  
31  my $maxmfn = $webpac->open_isis(  my $maxmfn = $webpac->open_isis(
32          filename => shift @ARGV || '/data/hidra/THS/THS',          filename => shift @ARGV || '/data/hidra/THS/THS',
33          lookup => [          lookup => [
# Line 29  my $maxmfn = $webpac->open_isis( Line 36  my $maxmfn = $webpac->open_isis(
36  #       { 'eval '=> '"v901^a" eq "Mikrotezaurus"', 'key' => 'a:v561^4:v562^4:v461^1', 'val' => 'v900' },  #       { 'eval '=> '"v901^a" eq "Mikrotezaurus"', 'key' => 'a:v561^4:v562^4:v461^1', 'val' => 'v900' },
37  #       { 'eval' => '"v901^a" eq "Deskriptor"', 'key' => 'a:v561^4:v562^4:v461^1', 'val' => 'v900' },  #       { 'eval' => '"v901^a" eq "Deskriptor"', 'key' => 'a:v561^4:v562^4:v461^1', 'val' => 'v900' },
38          { 'key' => 'a:v561^4:v562^4:v461^1', 'val' => 'v900' },          { 'key' => 'a:v561^4:v562^4:v461^1', 'val' => 'v900' },
39            { 'key' => '900_mfn:v900', 'val' => 'v000' },
40          ],          ],
41  );  );
42    
43  print "rows: $maxmfn\n\n";  $log->info("rows: $maxmfn");
44    
45  while (my $rec = $webpac->fetch_rec) {  $webpac->open_import_xml(type => 'isis_hidra_ths');
46    
47          print "-- ",$webpac->parse($rec,'v250^a / [v562^4] v562^a'),"\n";  while (my $rec = $webpac->fetch_rec) {
48    
49          print " ",          my @ds = $webpac->data_structure($rec);
                 $webpac->parse($rec,'eval{v901^a eq "Deskriptor"}v250^a / [v562^4] v562^a'),  
                 $webpac->parse($rec,'eval{v901^a ne "Deskriptor"}250a [251]'),  
                 "\n";  
50    
51          my @t = $webpac->fill_in($rec,'v553^1;;v553^a');          if ($log->is_debug) {
52          print " Uži pojam: ",join("\t\n",@t),"\n" if (@t);                  $log->debug("rec = ",Dumper($rec));
53                    $log->debug("ds = ",Dumper(\@ds));
54            }
55    
56            next if (! @ds);
57    
58            my $filename = $webpac->{'current_filename'};
59    
60            if ($filename) {
61                    open(OUT,"> $filename") || $log->logdie("can't open output '$filename': $!");
62                    print OUT $webpac->output(
63                            template => 'html.tt',
64                            data => \@ds,
65                    );
66                    close(OUT);
67            } else {
68                    print $webpac->output(
69                            template => 'text.tt',
70                            data => \@ds,
71                    );
72            }
73    
74            my $headline;
75            foreach my $ds (@ds) {
76                    if ($ds->{'tag'} eq 'headline') {
77                            $headline = join(" ",@{$ds->{'display'}});
78                            last;
79                    }
80            }
81    
82            my $f = $filename;
83            $f =~ s!out/!!;
84    
85            # save into index
86            foreach my $ds (@ds) {
87                    next if (! $ds->{'swish'});
88    
89                    $index->insert(
90                            index_name => $ds->{'tag'},
91                            path => $f,
92                            headline => $headline,
93                            words => join(" ",@{$ds->{'swish'}})
94                    );
95            }
96    
97          @t = $webpac->fill_in($rec,'eval{v901^a eq "Područje"}[a:v251::];;[d:[a:v251::]]');  #       print Dumper(\@ds);
         print " Područje: ",join("\t\n",@t),"\n" if (@t);  
98    
99          @t = $webpac->fill_in($rec,'eval{v901^a eq "Mikrotezaurus"}[a:v561^4:v251:];;[d:[a:v561^4:v251:]]');  }
         print " Mikrotezaurus: ",join("\t\n",@t),"\n" if (@t);  
100    
101          @t = $webpac->fill_in($rec,'eval{v901^a eq "Deskriptor"}[a:v561^4:v562^4:v900];;[d:[a:v561^4:v562^4:v900]]');  if ($log->is_debug) {
102          print " Deskriptor: ",join("\t\n",@t),"\n" if (@t);          $log->debug("lookup hash: ",Dumper($webpac->{'lookup'}));
103            $log->debug("data hash: ",Dumper($webpac->{'data'}));
104  }  }
105    
106  print "## lookup ",Dumper($webpac->{'lookup'});  $index->close;
107  print "## data ",Dumper($webpac->{'data'});  

Legend:
Removed from v.362  
changed lines
  Added in v.392

  ViewVC Help
Powered by ViewVC 1.1.26