/[irc-logger]/trunk/irc-logger.pl
This is a repository of my old source code, which is no longer updated. Go to git.rot13.org for current projects!
ViewVC logotype

Annotation of /trunk/irc-logger.pl

Parent Directory Parent Directory | Revision Log Revision Log


Revision 28 - (hide annotations)
Fri Jun 16 20:51:32 2006 UTC (17 years, 9 months ago) by dpavlin
File MIME type: text/plain
File size: 15046 byte(s)
added tags to html interface

1 dpavlin 4 #!/usr/bin/perl -w
2     use strict;
3     $|++;
4    
5 dpavlin 5 =head1 NAME
6    
7     irc-logger.pl
8    
9     =head1 SYNOPSIS
10    
11     ./irc-logger.pl
12    
13     =head1 DESCRIPTION
14    
15     log all conversation on irc channel
16    
17     =cut
18    
## CONFIG

# Nickname used on IRC; it is also reused for the Ircname hint and the database name below.
my $NICK = 'irc-logger-dev';

# Parameters handed to the IRC component with the "connect" event.
my $CONNECT = {
	Server  => 'irc.freenode.net',
	Nick    => $NICK,
	Ircname => "try /msg $NICK help",
};

# Channel that is joined and logged, and the POE alias of the IRC component.
my $CHANNEL   = '#razmjenavjestina';
my $IRC_ALIAS = "log";

# Files the my_add state would tail, keyed by a short label.
my %FOLLOWS = (
	ACCESS => "/var/log/apache/access.log",
	ERROR  => "/var/log/apache/error.log",
);

# DBI data source; the PostgreSQL database carries the same name as the nick.
my $DSN = 'DBI:Pg:dbname=' . $NICK;

# Encoding that incoming UTF-8 messages are converted to, also announced as the HTML charset.
my $ENCODING = 'ISO-8859-2';

## END CONFIG
41    
42 dpavlin 5
43    
44 dpavlin 13 use POE qw(Component::IRC Wheel::FollowTail Component::Server::HTTP);
45     use HTTP::Status;
46 dpavlin 5 use DBI;
47 dpavlin 6 use Encode qw/from_to/;
48 dpavlin 15 use Regexp::Common qw /URI/;
49 dpavlin 16 use CGI::Simple;
50 dpavlin 28 use HTML::TagCloud;
51 dpavlin 5
# Open the database handle; with RaiseError set, later DBI failures die instead of returning false.
my $dbh = DBI->connect(
	$DSN, "", "",
	{ RaiseError => 1, AutoCommit => 1 },
) || die $DBI::errstr;

# Probe for the log table: the query dies (and sets $@) when it cannot be run.
eval { $dbh->do(qq{ select count(*) from log }) };

if (my $probe_error = $@) {
	# Any probe failure is treated as "table missing", so the schema is created here.
	warn "creating database table in $DSN\n";
	$dbh->do(<<'_SQL_SCHEMA_');

create table log (
	id serial,
	time timestamp default now(),
	channel text not null,
	me boolean default false,
	nick text not null,
	message text not null,
	primary key(id)
);

create index log_time on log(time);
create index log_channel on log(channel);
create index log_nick on log(nick);

_SQL_SCHEMA_
}

# Insert statement shared by the irc_public and irc_ctcp_action handlers.
my $sth = $dbh->prepare(qq{
	insert into log
		(channel, me, nick, message)
	values (?,?,?,?)
});

# In-memory tag cache: tag name => array reference of log ids (filled by add_tag).
my $tags;
86    
=head2 get_from_log

 my @messages = get_from_log(
	limit => 42,
	search => '%what to stuff in ilike%',
	tag => 'sometag',
	fmt => {
		date => '[%s] ',
		time => '{%s} ',
		time_channel => '{%s %s} ',
		nick => '%s: ',
		me_nick => '***%s ',
		message => '%s',
	},
	filter => {
		message => sub {
			# modify message content
			return shift;
		},
		nick => sub {
			# modify nick
			return shift;
		},
	},
	context => 5,
 );

Returns a list of formatted lines. The first element is always a
C<Showing N messages...> header; consecutive messages from the same nick are
joined into a single element.

Order is important. Fields are first passed through C<filter> (if available) and
then through C<< sprintf($fmt->{message}, $message) >> if available. A key
missing from a caller-supplied C<fmt> produces no output for that field, except
for C<nick> and C<message> which fall back to C<%s>.

C<limit> must consist of digits only; anything else falls back to 10.

C<search> is matched with C<ilike> against both message and nick. C<tag>
restricts the result to ids recorded for that tag in the in-memory tag cache; a
tag that is not in the cache is ignored. When both are given they are combined
with C<and>.

C<context> defines number of messages around each search hit for display. It
can also be given as a C<+N> suffix inside C<search> (for example C<foo +5>),
which takes precedence over the C<context> argument.

=cut

sub get_from_log {
	my $args = {@_};

	# limit ends up inside the SQL text, so accept nothing but plain digits
	my $limit = $args->{limit};
	$limit = 10 unless ($limit && $limit =~ m/\A\d+\z/);

	$args->{fmt} ||= {
		date => '[%s] ',
		time => '{%s} ',
		time_channel => '{%s %s} ',
		nick => '%s: ',
		me_nick => '***%s ',
		message => '%s',
	};
	my $fmt = $args->{fmt};
	$fmt->{message} ||= '%s';

	# format one field; a format missing from a caller-supplied fmt yields ''
	# instead of calling sprintf with an undefined format
	my $render = sub {
		my ($name, @values) = @_;
		return defined $fmt->{$name} ? sprintf($fmt->{$name}, @values) : '';
	};

	my $sql_message = qq{
		select
			time::date as date,
			time::time as time,
			channel,
			me,
			nick,
			message
		from log
	};

	my $sql_context = qq{
		select
			id
		from log
	};

	# declared unconditionally: "my $x = ... if (...)" has undefined behaviour
	# and may keep a value from a previous call
	my $context;
	$context = $args->{context} if ($args->{context} && $args->{context} =~ m/\A\d+\z/);
	if ($args->{search} && $args->{search} =~ s/\s*\+(\d+)\s*/ /) {
		$context = $1;
	}

	# collect conditions first so search and tag can never produce two "where" keywords
	my (@where, @bind);

	my $search = $args->{search};
	if ($search) {
		$search =~ s/^\s+//;
		$search =~ s/\s+$//;
		push @where, '(message ilike ? or nick ilike ?)';
		push @bind, ( '%' . $search . '%' ) x 2;
	}

	my $tag = $args->{tag};
	if ($tag && $tags->{$tag}) {
		# ids originate from the log table; keep only plain integers before inlining them
		my @ids = grep { defined $_ && m/\A\d+\z/ } @{ $tags->{$tag} };
		push @where, 'id in (' . join(",", @ids) . ')' if (@ids);
	}

	my $sql = $context ? $sql_context : $sql_message;
	$sql .= ' where ' . join(' and ', @where) if (@where);
	$sql .= " order by log.time desc";
	$sql .= " limit " . $limit;

	my $sth = $dbh->prepare( $sql );
	$sth->execute( @bind );

	if ($search) {
		warn "search for '$search' returned ", $sth->rows, " results ", $context || '', "\n";
	} elsif ($tag) {
		warn "tag '$tag' returned ", $sth->rows, " results ", $context || '', "\n";
	}

	my $last_row = {
		date => '',
		time => '',
		channel => '',
		nick => '',
	};

	# the query returns newest first; reverse so that output is chronological
	my @rows = reverse @{ $sth->fetchall_arrayref({}) };

	my @msgs = (
		"Showing " . scalar(@rows) . " messages..."
	);

	if ($context) {
		# in context mode @rows holds only ids of the hits; replace them with
		# the messages whose id lies in [id - context, id + context)
		my @ids = @rows;
		@rows = ();

		my $last_to = 0;

		my $sth = $dbh->prepare( $sql_message . qq{ where id >= ? and id < ? order by id } );
		foreach my $row_id (sort { $a->{id} <=> $b->{id} } @ids) {
			my $id = $row_id->{id} || die "can't find id in row";

			my ($from, $to) = ($id - $context, $id + $context);
			# windows of neighbouring hits may overlap; never fetch a message twice
			$from = $last_to if ($from < $last_to);
			$last_to = $to;
			$sth->execute( $from, $to );

			#warn "## id: $id from: $from to: $to returned: ", $sth->rows, "\n";

			push @rows, @{ $sth->fetchall_arrayref({}) };
		}
	}

	foreach my $row (@rows) {

		# strip fractional seconds
		$row->{time} =~ s#\.\d+##;

		my $msg = '';

		# date is shown only when it differs from the previous row
		$msg = $render->('date', $row->{date}) . ' ' if ($last_row->{date} ne $row->{date});

		if ($last_row->{channel} ne $row->{channel}) {
			$msg .= $render->('time_channel', $row->{time}, $row->{channel});
		} else {
			$msg .= $render->('time', $row->{time});
		}

		my $append = 1;

		# ignore leading and trailing underscores so that nick_ and nick count as the same person
		my $nick = $row->{nick};
		if ($nick =~ s/^_*(.*?)_*$/$1/) {
			$row->{nick} = $nick;
		}

		if ($last_row->{nick} ne $nick) {
			# use me_nick format for actions if available, otherwise the plain nick format
			my $nick_fmt = $row->{me} ? ( $fmt->{me_nick} || $fmt->{nick} ) : $fmt->{nick};
			$nick_fmt ||= '%s';

			$nick = $args->{filter}->{nick}->($nick) if (ref($args->{filter}->{nick}) eq 'CODE');

			$msg .= sprintf( $nick_fmt, $nick );
			$append = 0;
		}

		if (ref($args->{filter}->{message}) eq 'CODE') {
			$msg .= sprintf($fmt->{message},
				$args->{filter}->{message}->(
					$row->{message}
				)
			);
		} else {
			$msg .= sprintf($fmt->{message}, $row->{message});
		}

		# a message from the same nick as the previous row continues the previous line
		if ($append && @msgs) {
			$msgs[$#msgs] .= " " . $msg;
		} else {
			push @msgs, $msg;
		}

		$last_row = $row;
	}

	return @msgs;
}
263    
264    
my $SKIPPING = 0;	# if skipping, how many we've done
my $SEND_QUEUE;		# cache

POE::Component::IRC->new($IRC_ALIAS);

# Main session: connects to the IRC server, stores channel traffic in the
# database and answers private-message commands (help, msg, stat, last,
# search/grep).
POE::Session->create
	(inline_states =>
		{_start => sub {
				$_[KERNEL]->post($IRC_ALIAS => register => 'all');
				$_[KERNEL]->post($IRC_ALIAS => connect => $CONNECT);
			},
			irc_255 => sub {	# server is done blabbing
				$_[KERNEL]->post($IRC_ALIAS => join => $CHANNEL);
				$_[KERNEL]->post($IRC_ALIAS => join => '#logger');
				# NOTE(review): no state named "heartbeat" exists in this session (the
				# state below is called my_heartbeat), so this event ends up in _default.
				# Left unchanged on purpose: my_heartbeat would post "beep" to the
				# channel every 10 seconds.
				$_[KERNEL]->yield("heartbeat"); # start heartbeat
#				$_[KERNEL]->yield("my_add", $_) for keys %FOLLOWS;
				$_[KERNEL]->post( $IRC_ALIAS => privmsg => 'nickserv', "IDENTIFY $NICK" );
			},
			# message said in a channel: store it with me = 0
			irc_public => sub {
				my $nick = (split /!/, $_[ARG0])[0];
				my $channel = $_[ARG1]->[0];
				my $msg = $_[ARG2];

				from_to($msg, 'UTF-8', $ENCODING);

				print "$channel: <$nick> $msg\n";
				$sth->execute($channel, 0, $nick, $msg);
			},
			# /me action in a channel: store it with me = 1
			irc_ctcp_action => sub {
				my $nick = (split /!/, $_[ARG0])[0];
				my $channel = $_[ARG1]->[0];
				my $msg = $_[ARG2];

				from_to($msg, 'UTF-8', $ENCODING);

				print "$channel ***$nick $msg\n";
				$sth->execute($channel, 1, $nick, $msg);
			},
			# private message to the bot: interpret it as a command
			irc_msg => sub {
				my $nick = (split /!/, $_[ARG0])[0];
				my $msg = $_[ARG2];
				from_to($msg, 'UTF-8', $ENCODING);

				# reply sent at the end unless a command clears it
				my $res = "unknown command '$msg', try /msg $NICK help!";

				print "<< $msg\n";

				if ($msg =~ m/^help/i) {

					$res = "usage: /msg $NICK command | commands: stat - user/message stat | last - show backtrace | grep foobar - find foobar";

				} elsif ($msg =~ m/^msg\s+(\S+)\s+(.*)$/i) {

					# relay: send text to another nick or channel on behalf of the sender
					my ($to, $text) = ($1, $2);
					print ">> /msg $to $text\n";
					$_[KERNEL]->post( $IRC_ALIAS => privmsg => $to, $text );
					$res = '';

				} elsif ($msg =~ m/^stat[a-z]*\s*(\d*)/i) {

					# [a-z]* instead of a lazy .*? so that "stats 5" still captures the number;
					# the capture is digits only, which makes it safe to put into the SQL text
					my $nr = $1 || 10;

					my $sth = $dbh->prepare(qq{
						select nick,count(*) from log group by nick order by count desc limit $nr
					});
					$sth->execute();
					$res = "Top $nr users: ";
					my @users;
					while (my $row = $sth->fetchrow_hashref) {
						push @users,$row->{nick} . ': ' . $row->{count};
					}
					$res .= join(" | ", @users);

				} elsif ($msg =~ m/^last[a-z]*\s*(\d*)/i) {

					# an empty capture makes get_from_log fall back to its default limit
					foreach my $res (get_from_log( limit => $1 )) {
						print "last: $res\n";
						from_to($res, $ENCODING, 'UTF-8');
						$_[KERNEL]->post( $IRC_ALIAS => privmsg => $nick, $res );
					}

					$res = '';

				} elsif ($msg =~ m/^(search|grep)\s+(.*)\s*$/i) {

					my $what = $2;

					foreach my $res (get_from_log(
							limit => 20,
							search => $what,
						)) {
						print "search [$what]: $res\n";
						from_to($res, $ENCODING, 'UTF-8');
						$_[KERNEL]->post( $IRC_ALIAS => privmsg => $nick, $res );
					}

					$res = '';

				}

				if ($res) {
					print ">> [$nick] $res\n";
					from_to($res, $ENCODING, 'UTF-8');
					$_[KERNEL]->post( $IRC_ALIAS => privmsg => $nick, $res );
				}

			},
			# numerics 477 and 505 both trigger a nickserv registration attempt
			irc_477 => sub {
				print "# irc_477: ",$_[ARG1], "\n";
				$_[KERNEL]->post( $IRC_ALIAS => privmsg => 'nickserv', "register $NICK" );
			},
			irc_505 => sub {
				print "# irc_505: ",$_[ARG1], "\n";
				$_[KERNEL]->post( $IRC_ALIAS => privmsg => 'nickserv', "register $NICK" );
#				$_[KERNEL]->post( $IRC_ALIAS => privmsg => 'nickserv', "set hide email on" );
#				$_[KERNEL]->post( $IRC_ALIAS => privmsg => 'nickserv', "set email dpavlin\@rot13.org" );
			},
			irc_registered => sub {
				warn "## indetify $NICK\n";
				$_[KERNEL]->post( $IRC_ALIAS => privmsg => 'nickserv', "IDENTIFY $NICK" );
			},
#			irc_433 => sub {
#				print "# irc_433: ",$_[ARG1], "\n";
#				warn "## indetify $NICK\n";
#				$_[KERNEL]->post( $IRC_ALIAS => privmsg => 'nickserv', "IDENTIFY $NICK" );
#			},
			irc_372 => sub {
				print "MOTD: ", $_[ARG1], "\n";
			},
			irc_snotice => sub {
				print "(server notice): ", $_[ARG0], "\n";
			},
			# events listed inside qw() get an empty handler and are thereby kept
			# away from _default; the list is currently empty
			(map
				{
					;"irc_$_" => sub { }}
				qw(
				)),
#				join
#				ctcp_version
#				connected snotice ctcp_action ping notice mode part quit
#				001 002 003 004 005
#				250 251 252 253 254 265 266
#				332 333 353 366 372 375 376
#				477
			_child => sub {},
			# report every event that has no handler of its own
			_default => sub {
				printf "%s: session %s caught an unhandled %s event.\n",
					scalar localtime(), $_[SESSION]->ID, $_[ARG0];
				print "The $_[ARG0] event was given these parameters: ",
					join(" ", map({"ARRAY" eq ref $_ ? "[@$_]" : "$_"} @{$_[ARG1]})), "\n";
				0;	# false for signals
			},
			# start tailing the file registered in %FOLLOWS under the given label;
			# every new line is forwarded to my_tailed of this session
			my_add => sub {
				my $trailing = $_[ARG0];
				my $session = $_[SESSION];
				POE::Session->create
					(inline_states =>
						{_start => sub {
								$_[HEAP]->{wheel} =
									POE::Wheel::FollowTail->new
										(
											Filename => $FOLLOWS{$trailing},
											InputEvent => 'got_line',
										);
							},
							got_line => sub {
								$_[KERNEL]->post($session => my_tailed =>
									time, $trailing, $_[ARG0]);
							},
						},
					);

			},
			my_tailed => sub {
				my ($time, $file, $line) = @_[ARG0..ARG2];
				## $time will be undef on a probe, or a time value if a real line

				## PoCo::IRC has throttling built in, but no external visibility
				## so this is reaching "under the hood"
				$SEND_QUEUE ||=
					$_[KERNEL]->alias_resolve($IRC_ALIAS)->get_heap->{send_queue};

				## handle "no need to keep skipping" transition
				if ($SKIPPING and @$SEND_QUEUE < 1) {
					$_[KERNEL]->post($IRC_ALIAS => privmsg => $CHANNEL =>
						"[discarded $SKIPPING messages]");
					$SKIPPING = 0;
				}

				## handle potential message display
				if ($time) {
					if ($SKIPPING or @$SEND_QUEUE > 3) { # 3 msgs per 10 seconds
						$SKIPPING++;
					} else {
						my @time = localtime $time;
						# hour is printed on a 12-hour clock
						$_[KERNEL]->post($IRC_ALIAS => privmsg => $CHANNEL =>
							sprintf "%02d:%02d:%02d: %s: %s",
							($time[2] + 11) % 12 + 1, $time[1], $time[0],
							$file, $line);
					}
				}

				## handle re-probe/flush if skipping
				if ($SKIPPING) {
					$_[KERNEL]->delay($_[STATE] => 0.5); # $time will be undef
				}

			},
			# feeds a "beep" line into my_tailed and re-arms itself every 10 seconds
			my_heartbeat => sub {
				$_[KERNEL]->yield(my_tailed => time, "heartbeat", "beep");
				$_[KERNEL]->delay($_[STATE] => 10);
			}
		},
	);
481    
482 dpavlin 28 # tags support
483    
484     my $cloud = HTML::TagCloud->new;
485    
=head2 add_tag

 add_tag( id => 42, message => 'irc message' );

Records C<id> in the in-memory tag cache under every C<tag//> marker found in
C<message>. Does nothing unless both C<id> and C<message> are true.

=cut

sub add_tag {
	my %param = @_;

	my ($id, $text) = @param{qw(id message)};
	return unless ($id && $text);

	# every successful substitution removes one "tag//" marker from our private copy of the text
	while ($text =~ s#\b(\S+)//##s) {
		my $tag = $1;
		# false captures and the scheme part of http:// or https:// links are not tags
		next if (! $tag || $tag =~ m/https?:/i);
		push @{ $tags->{$tag} }, $id;
	}
}
503    
=head2 seed_tags

Read all tags from database and create in-memory cache for tags.

Every log row whose message contains C<//> is passed to C<add_tag>; afterwards
each collected tag is added to the tag cloud with a C<?tag=...> link and a
weight of (number of recorded ids + 1).

=cut

sub seed_tags {
	my $sth = $dbh->prepare(qq{ select id,message from log where message like '%//%' });
	$sth->execute;
	while (my $row = $sth->fetchrow_hashref) {
		add_tag( %$row );
	}

	foreach my $tag (keys %{ $tags || {} }) {
		# percent-encode the tag so that characters like & # + % cannot break the query string
		# NOTE(review): assumes tags are byte strings (no characters above 255) -- confirm
		(my $tag_in_url = $tag) =~ s/([^A-Za-z0-9_.~-])/sprintf('%%%02X', ord($1))/ge;
		$cloud->add($tag, "?tag=$tag_in_url", scalar(@{ $tags->{$tag} }) + 1);
	}
}
521    
522     seed_tags;
523    
# http server

# Instances whose nick contains "-dev" listen on port 8001, all others on 8000.
my $httpd = POE::Component::Server::HTTP->new(
	Port           => ( $NICK =~ m/-dev/ ? 8001 : 8000 ),
	ContentHandler => { '/' => \&root_handler },
	Headers        => { Server => 'irc-logger' },
);

# HTML special characters and their entities, plus an alternation matching any of them.
my %escape = (
	'<' => '&lt;',
	'>' => '&gt;',
	'&' => '&amp;',
	'"' => '&quot;',
);
my $escape_re = join '|' => keys %escape;

# Stylesheet embedded into every generated page.
my $style = <<'_END_OF_STYLE_';
p { margin: 0; padding: 0.1em; }
.time, .channel { color: #808080; font-size: 60%; }
.date { float: right; background: #e0e0e0; color: #404040; font-size: 120%; padding: 0.25em; border: 1px dashed #808080; }
.nick { color: #000000; font-size: 80%; padding: 2px; font-family: courier, courier new, monospace ; }
.message { color: #000000; font-size: 100%; }
.search { float: right; }
.col-0 { background: #ffff66 }
.col-1 { background: #a0ffff }
.col-2 { background: #99ff99 }
.col-3 { background: #ff9999 }
.col-4 { background: #ff66ff }
_END_OF_STYLE_

# Modulus root_handler applies to a nick's sequence number to pick its col-N class.
my $max_color = 4;

# nick => sequence number, assigned by root_handler in order of first appearance.
my %nick_enumerator;
552    
# Content handler for "/": renders the search form, the tag cloud and the log
# messages selected by the "search"/"grep", "tag" and "last" request parameters.
#
# Arguments: the request and response objects passed in by the HTTP server component.
# Returns:   RC_OK after filling in the response.
sub root_handler {
	my ($request, $response) = @_;
	$response->code(RC_OK);
	$response->content_type("text/html; charset=$ENCODING");

	# parameters come from the POST body or from the query string of the URI
	my $q;

	if ( $request->method eq 'POST' ) {
		$q = CGI::Simple->new( $request->content );
	} elsif ( $request->uri =~ /\?(.+)$/ ) {
		$q = CGI::Simple->new( $1 );
	} else {
		$q = CGI::Simple->new;
	}

	my $search = $q->param('search') || $q->param('grep') || '';

	# Scalar assignment on purpose: called in list context inside the argument
	# list below, param() may return an empty list for a missing parameter,
	# which would shift every following key/value pair (fmt, filter) out of place.
	my $tag = $q->param('tag');

	# limit ends up in SQL text, so only plain digits are accepted
	my $limit = $q->param('last');
	$limit = 100 unless ($limit && $limit =~ m/\A\d+\z/);

	my $html_escape = sub {
		my $text = shift;
		$text =~ s/($escape_re)/$escape{$1}/gs;
		return $text;
	};

	# the search term is echoed back inside an HTML attribute and must be escaped
	my $search_html = $html_escape->($search);

	# match https as well as http links
	my $uri_re = $RE{URI}{HTTP}{-scheme => 'https?'};

	$response->content(
		qq{<html><head><title>$NICK</title><style type="text/css">$style} .
		$cloud->css .
		qq{</style></head><body>} .
		qq{
		<form method="post" class="search">
		<input type="text" name="search" value="$search_html" size="10">
		<input type="submit" value="search">
		</form>
		} .
		qq{<div>} . $cloud->html(500) . qq{</div>} .
		qq{<p>} .
		join("</p><p>",
			get_from_log(
				limit => $limit,
				search => $search || undef,
				tag => $tag,
				fmt => {
					date => '<hr size="1" style="clear: both;"/><div class="date">%s</div> ',
					time => '<span class="time">%s</span> ',
					time_channel => '<span class="channel">%s %s</span> ',
					nick => '%s:&nbsp;',
					me_nick => '***%s&nbsp;',
					message => '<span class="message">%s</span>',
				},
				filter => {
					# escape HTML first, then turn URLs into links
					message => sub {
						my $m = shift;
						# always return exactly one value, also for a message of "0"
						return '' unless (defined $m && length $m);
						$m = $html_escape->($m);
						$m =~ s#($uri_re)#<a href="$1">$1</a>#gs;
						return $m;
					},
					# wrap nick into a span whose col-N class depends on order of first appearance
					nick => sub {
						my $n = shift;
						return '' unless (defined $n && length $n);
						if (! $nick_enumerator{$n}) {
							my $max = scalar keys %nick_enumerator;
							$nick_enumerator{$n} = $max + 1;
						}
						# the stylesheet defines col-0 .. col-$max_color, hence modulo $max_color + 1
						return '<span class="nick col-' .
							( $nick_enumerator{$n} % ( $max_color + 1 ) ) .
							'">' . $html_escape->($n) . '</span>';
					},
				},
			)
		) .
		qq{</p></body></html>}
	);
	return RC_OK;
}
619    
620 dpavlin 4 POE::Kernel->run;

Properties

Name Value
svn:executable *

  ViewVC Help
Powered by ViewVC 1.1.26