about | summary | refs | log | tree | commit | diff
path: root/src/phinde
diff options
context:
space:
mode:
author: Christian Weiske <cweiske@cweiske.de> 2016-08-30 08:13:33 +0200
committer: Christian Weiske <cweiske@cweiske.de> 2016-08-30 08:13:33 +0200
commit: 45638a5de3c8c05c1792f8a3ab93acb11a2c1a86 (patch)
tree: 47f67feac7e1d85d42b6f36427acfd77e0d3a7d3 /src/phinde
parent: 59f931647a2b4a13be20ba8f2baa4ec93e334ee5 (diff)
download: phinde-45638a5de3c8c05c1792f8a3ab93acb11a2c1a86.tar.gz
phinde-45638a5de3c8c05c1792f8a3ab93acb11a2c1a86.zip
Option to disable linked URL indexing
Resolves: #2
Diffstat (limited to 'src/phinde')
-rw-r--r-- src/phinde/Crawler.php 18
1 files changed, 13 insertions, 5 deletions
diff --git a/src/phinde/Crawler.php b/src/phinde/Crawler.php
index 43d9459..6459fb4 100644
--- a/src/phinde/Crawler.php
+++ b/src/phinde/Crawler.php
@@ -84,11 +84,19 @@ class Crawler
if ($this->es->isKnown($linkInfo->url)) {
continue;
}
- $this->es->markQueued($linkInfo->url);
- $this->queue->addToIndex(
- $linkInfo->url, $linkInfo->title, $linkInfo->source
- );
- if (Helper::isUrlAllowed($linkInfo->url)) {
+ $allowed = Helper::isUrlAllowed($linkInfo->url);
+ $crawl = $allowed;
+ $index = $GLOBALS['phinde']['indexNonAllowed'] || $allowed;
+
+ if ($crawl || $index) {
+ $this->es->markQueued($linkInfo->url);
+ }
+ if ($index) {
+ $this->queue->addToIndex(
+ $linkInfo->url, $linkInfo->title, $linkInfo->source
+ );
+ }
+ if ($allowed) {
$this->queue->addToCrawl($linkInfo->url);
}
}