blob: 1e2641a4c91ffb1f1f751f5fc653adce2c8a2fc0 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
|
<?php
/*
 * phinde settings, stored under the 'phinde' key of the $GLOBALS superglobal.
 * All values below are sample defaults; adjust them for your installation.
 */
$GLOBALS['phinde'] = [
    // Elasticsearch URL. NOTE(review): judging by the value this is the
    // server address plus the "phinde" index path - confirm against the code
    // that reads this setting.
    'elasticsearch' => 'http://127.0.0.1:9200/phinde/',

    // Whitelist: only these domains shall be crawled.
    'domains' => [
        'www.example.org',
        'test.example.org',
    ],

    // URLs that begin with one of these strings are ignored.
    'blacklist' => [
        'http://bad.example.org/',
    ],

    // Regular expressions; URLs matching one of them are not crawled.
    // Empty by default.
    'crawlBlacklist' => [],

    // URLs to subscribe to via PubSubHubbub.
    'subscriptions' => [
        'http://www.example.org/feed',
    ],

    // Number of seconds after which a URL may be re-indexed
    // (86400 seconds = 24 hours).
    'refreshtime' => 86400,

    // Whether directly linked URLs are indexed even when they live on a
    // domain that is not on the whitelist above.
    'indexNonAllowed' => true,

    // Prefix for the gearman queue names. Needed when several instances
    // run in parallel.
    'queuePrefix' => '',

    // Whether the full text content is shown in the results. Useful for
    // chat logs in which every line is its own document.
    'showFullContent' => false,
];
?>
|