diff options
| author | Christian Weiske <cweiske@cweiske.de> | 2016-02-11 20:02:30 +0100 |
|---|---|---|
| committer | Christian Weiske <cweiske@cweiske.de> | 2016-02-11 20:02:30 +0100 |
| commit | e43db7fd25798616ad38a959bd378bb765b9323c (patch) | |
| tree | 5d3db821ab5d4ffe124d755a125f4c5acfd724ff /src/phinde/LinkExtractor/Html.php | |
| parent | d8c39f2b0571b9734259b2f9dc218eed24412332 (diff) | |
| download | phinde-e43db7fd25798616ad38a959bd378bb765b9323c.tar.gz phinde-e43db7fd25798616ad38a959bd378bb765b9323c.zip | |
support base href
Diffstat (limited to 'src/phinde/LinkExtractor/Html.php')
| -rw-r--r-- | src/phinde/LinkExtractor/Html.php | 7 |
1 files changed, 7 insertions, 0 deletions
```diff
diff --git a/src/phinde/LinkExtractor/Html.php b/src/phinde/LinkExtractor/Html.php
index a6fa8ef..7b987e3 100644
--- a/src/phinde/LinkExtractor/Html.php
+++ b/src/phinde/LinkExtractor/Html.php
@@ -22,6 +22,13 @@ class Html
         $dx = new \DOMXPath($doc);
 
+        $xbase = $dx->evaluate('/html/head/base[@href]')->item(0);
+        if ($xbase) {
+            $base = $base->resolve(
+                $xbase->attributes->getNamedItem('href')->textContent
+            );
+        }
+
         $meta = $dx->evaluate('/html/head/meta[@name="robots" and @content]')
             ->item(0);
         if ($meta) {
```
