/[meteor]/trunk/Meteor/Koha.pm
This is repository of my old source code which isn't updated any more. Go to git.rot13.org for current projects!
ViewVC logotype

Annotation of /trunk/Meteor/Koha.pm

Parent Directory Parent Directory | Revision Log Revision Log


Revision 79 - (hide annotations)
Sun Mar 29 00:11:48 2009 UTC (15 years, 1 month ago) by dpavlin
File size: 1372 byte(s)
use HTML::Query and half of CPAN to nicely parse html
from Koha with CSS expressions
1 dpavlin 70 package Meteor::Koha;
2    
3     use strict;
4     use warnings;
5    
6     use LWP::UserAgent;
7    
8     my $ua = LWP::UserAgent->new;
9    
10 dpavlin 71 our $cache;
11    
12 dpavlin 79 use HTML::Query qw/Query/;
13     use File::Slurp;
14     use Encode qw/decode/;
15     use Data::Dump qw/dump/;
16    
17 dpavlin 70 sub item {
18     my ( $class, $client, $item ) = @_;
19    
20 dpavlin 71 my $html;
21 dpavlin 77 my $status = 200;
22 dpavlin 70
23 dpavlin 79 my $path = "cache/$item.html";
24    
25 dpavlin 71 if ( $html = $cache->{$item} ) {
26 dpavlin 70
27 dpavlin 71 warn "# koha item $item from cache\n";
28 dpavlin 70
29 dpavlin 79 } elsif ( 0 && -e $path ) { # FIXME enable
30    
31     $html = $cache->{$item} = read_file( $path );
32    
33 dpavlin 71 } else {
34    
35     my $url = 'http://koha.ffzg.hr/cgi-bin/koha/opac-detail.pl?biblionumber=' . $item;
36    
37     my $response = $ua->get( $url );
38    
39 dpavlin 77 if ($response->is_success) {
40 dpavlin 71
41 dpavlin 77 $html = $response->content;
42    
43 dpavlin 79 write_file( "cache/$item.koha.html", $html );
44    
45     warn "## size before: ", length( $html );
46    
47     $html = decode( 'utf-8', $html );
48     my $q = Query( text => $html, 'div.container' )
49     || die;
50     $html = $q->as_HTML->[0];
51    
52     warn "## size after: ", length( $html ), dump( $html );
53    
54 dpavlin 77 $cache->{$item} = $html;
55 dpavlin 79 write_file( $path, $html );
56 dpavlin 77
57     } else {
58    
59     $html = qq{Can't load $item } . $response->status_line;
60     # $status = 404;
61    
62     }
63 dpavlin 71 }
64    
65 dpavlin 70 my $len = length($html);
66    
67     warn "# koha item $item [$len]\n";
68    
69     $client->write(
70 dpavlin 77 "HTTP/1.1 $status OK\r\n" .
71 dpavlin 70 "Content-Type: text/html\r\n" .
72     "Content-length: $len\r\n" .
73     "Connection: close\r\n" .
74     "\r\n\r\n$html\r\n"
75     );
76    
77     }
78    
79     1;

  ViewVC Help
Powered by ViewVC 1.1.26