--- trunk/spider/swishspider	2003/03/24 09:57:44	30
+++ trunk/spider/swishspider	2003/04/30 12:40:09	32
@@ -73,6 +73,10 @@
     # >
     # which will confuse indexer (or libxml2?)
     $contents =~ s/[\n\r]^(>)/$1\n/msg;
+    # remove comments between <head> and </head>; texi2html inserts them
+    # there and swish can't find document title then (libxml or swish bug?)
+    # each pass strips one comment; the loop ends once <head> holds none
+    while ($contents =~ s/(<head\b[^>]*>.*?)<!--.*?-->(.*?<\/head>)/$1$2/msi) { };
 
     print CONTENTS $contents;
     close( CONTENTS );