X-Git-Url: https://git.cweiske.de/phinde.git/blobdiff_plain/d7651fd96dcfa2829519504e4c8ec1ce511cd57f..f98e891b454e5677bdf61f476e366b01af713b50:/src/phinde/Fetcher.php diff --git a/src/phinde/Fetcher.php b/src/phinde/Fetcher.php index b5644af..dccb118 100644 --- a/src/phinde/Fetcher.php +++ b/src/phinde/Fetcher.php @@ -43,7 +43,7 @@ class Fetcher $res = $req->send(); if ($res->getStatus() === 304) { //not modified since last time, so don't crawl again - echo "Not modified since last fetch\n"; + Log::info("Not modified since last fetch"); return false; } else if ($res->getStatus() !== 200) { throw new \Exception( @@ -52,7 +52,7 @@ class Fetcher ); } - $effUrl = $res->getEffectiveUrl(); + $effUrl = Helper::removeAnchor($res->getEffectiveUrl()); if ($effUrl != $url) { $this->storeRedirect($url, $effUrl); $url = $effUrl; @@ -69,17 +69,17 @@ class Fetcher protected function storeRedirect($url, $target) { - $esDoc = new \stdClass(); + $esDoc = Helper::baseDoc($url); $esDoc->status = (object) array( - 'location' => $target + 'location' => $target, + 'findable' => false, ); - $esDoc->url = $url; $this->storeDoc($url, $esDoc); } public function storeDoc($url, $esDoc) { - echo "Store $url\n"; + Log::info("Store $url"); $esDoc->status->processed = gmdate('c'); $r = new Elasticsearch_Request( $GLOBALS['phinde']['elasticsearch'] . 'document/'