From 8b9ae4fc9a3f8402001dd1a054658d5e1246efff Mon Sep 17 00:00:00 2001
From: Christian Weiske
Date: Thu, 1 Sep 2016 07:38:08 +0200
Subject: [PATCH] remove anchor from source URLs

---
Reviewer notes (free-text area after the three-dash line; not part of the
commit message or of the diff):

* Helper::removeAnchor($url) splits $url on '#' with a limit of 2 and
  returns element 0, i.e. everything before the first '#'. When $url
  contains no '#', the whole string is returned unchanged.
* Html::extract() now passes the value of $res->getEffectiveUrl() through
  Helper::removeAnchor() before assigning it to $url.
* NOTE(review): the Html.php hunk refers to the unqualified name "Helper";
  the namespace and use statements of that file are not visible in this
  patch -- confirm that the name resolves to the class in
  src/phinde/Helper.php.

 src/phinde/Helper.php             | 6 ++++++
 src/phinde/LinkExtractor/Html.php | 2 +-
 2 files changed, 7 insertions(+), 1 deletion(-)

diff --git a/src/phinde/Helper.php b/src/phinde/Helper.php
index 43345ba..8e30a19 100644
--- a/src/phinde/Helper.php
+++ b/src/phinde/Helper.php
@@ -31,6 +31,12 @@ class Helper
         return 'http://' . $url;
     }
 
+    public static function removeAnchor($url)
+    {
+        $parts = explode('#', $url, 2);
+        return $parts[0];
+    }
+
     public static function sanitizeTitle($str)
     {
         return trim(
diff --git a/src/phinde/LinkExtractor/Html.php b/src/phinde/LinkExtractor/Html.php
index 7b987e3..b3a9ea6 100644
--- a/src/phinde/LinkExtractor/Html.php
+++ b/src/phinde/LinkExtractor/Html.php
@@ -8,7 +8,7 @@ class Html
 {
     public function extract(\HTTP_Request2_Response $res)
     {
-        $url = $res->getEffectiveUrl();
+        $url = Helper::removeAnchor($res->getEffectiveUrl());
 
         $linkInfos = array();
 
-- 
2.30.2