68 |
#(default 60) The number of seconds to wait between issuing |
#(default 60) The number of seconds to wait between issuing |
69 |
#requests to a server. |
#requests to a server. |
70 |
|
|
71 |
SpiderDirectory /data/swish/spider |
SpiderDirectory /rest/references/swish/spider |
72 |
|
|
73 |
#EquivalentServer http://portal.pliva.hr http://www.pliva.hr |
#EquivalentServer http://portal.pliva.hr http://www.pliva.hr |
74 |
#(default nothing) This allows you to deal with |
#(default nothing) This allows you to deal with |
93 |
|
|
94 |
# index PDF files (converted by pdftotext, parsed as HTML) |
# index PDF files (converted by pdftotext, parsed as HTML) |
95 |
IndexContents HTML .pdf |
IndexContents HTML .pdf |
96 |
FileFilter .pdf pdftotext "-htmlmeta '%p' -" |
FileFilter .pdf pdftotext "-htmlmeta '%p' -" |
97 |
|
|
98 |
# various other filters (compressed files) |
# various other filters (compressed files) |
99 |
FileFilter .gz gzip "-cd '%p'" |
FileFilter .tar.gz tar "tvfz '%p'" |
100 |
FileFilter .bz2 bzip2 "-cd '%p'" |
FileFilter .gz gzip "-cd '%p'" |
101 |
|
FileFilter .bz2 bzip2 "-cd '%p'" |
102 |
|
|
103 |
|
# regex version of above ($ anchors each pattern to the end of the path) |
104 |
|
#FileFilterMatch tar "tvfz '%p'" /\.tar\.gz$/i |
105 |
|
#FileFilterMatch gzip "-cd '%p'" /\.gz$/i |
106 |
|
#FileFilterMatch bzip2 "-cd '%p'" /\.bz2$/i |
107 |
|
|
108 |
# store path of document |
# store path of document, title |
109 |
MetaNames swishdocpath |
MetaNames swishdocpath swishtitle |
110 |
|
|
111 |
# debug |
# debug |
112 |
ParserWarnLevel 3 |
ParserWarnLevel 3 |