diff options
| author | Christian Weiske <cweiske@cweiske.de> | 2016-09-01 07:38:08 +0200 |
|---|---|---|
| committer | Christian Weiske <cweiske@cweiske.de> | 2016-09-01 07:38:08 +0200 |
| commit | 8b9ae4fc9a3f8402001dd1a054658d5e1246efff (patch) | |
| tree | 26a1ad8bdd0856f8a66d7ad2981ec37a0a22e397 | |
| parent | 9d97bab663adb122d6edf7c15639a3457e94c71f (diff) | |
| download | phinde-8b9ae4fc9a3f8402001dd1a054658d5e1246efff.tar.gz phinde-8b9ae4fc9a3f8402001dd1a054658d5e1246efff.zip | |
remove anchor from source URLs
| -rw-r--r-- | src/phinde/Helper.php | 6 | ||||
| -rw-r--r-- | src/phinde/LinkExtractor/Html.php | 2 |
2 files changed, 7 insertions, 1 deletions
```diff
diff --git a/src/phinde/Helper.php b/src/phinde/Helper.php
index 43345ba..8e30a19 100644
--- a/src/phinde/Helper.php
+++ b/src/phinde/Helper.php
@@ -31,6 +31,12 @@ class Helper
         return 'http://' . $url;
     }
 
+    public static function removeAnchor($url)
+    {
+        $parts = explode('#', $url, 2);
+        return $parts[0];
+    }
+
     public static function sanitizeTitle($str)
     {
         return trim(
diff --git a/src/phinde/LinkExtractor/Html.php b/src/phinde/LinkExtractor/Html.php
index 7b987e3..b3a9ea6 100644
--- a/src/phinde/LinkExtractor/Html.php
+++ b/src/phinde/LinkExtractor/Html.php
@@ -8,7 +8,7 @@ class Html
 {
     public function extract(\HTTP_Request2_Response $res)
     {
-        $url = $res->getEffectiveUrl();
+        $url = Helper::removeAnchor($res->getEffectiveUrl());
 
         $linkInfos = array();
 
```
