git.cweiske.de
/
phinde.git
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
Fix string array access in php 8
[phinde.git]
/
src
/
phinde
/
LinkExtractor
/
Html.php
diff --git
a/src/phinde/LinkExtractor/Html.php
b/src/phinde/LinkExtractor/Html.php
index a6fa8efef8fe9725722bf94bbd137671b73e3afe..299ed912869587ced474b71c61a538a3d0f5b571 100644
(file)
--- a/
src/phinde/LinkExtractor/Html.php
+++ b/
src/phinde/LinkExtractor/Html.php
@@
-8,7
+8,7
@@
class Html
{
public function extract(\HTTP_Request2_Response $res)
{
{
public function extract(\HTTP_Request2_Response $res)
{
- $url =
$res->getEffectiveUrl(
);
+ $url =
Helper::removeAnchor($res->getEffectiveUrl()
);
$linkInfos = array();
$linkInfos = array();
@@
-22,6
+22,13
@@
class Html
$dx = new \DOMXPath($doc);
$dx = new \DOMXPath($doc);
+ $xbase = $dx->evaluate('/html/head/base[@href]')->item(0);
+ if ($xbase) {
+ $base = $base->resolve(
+ $xbase->attributes->getNamedItem('href')->textContent
+ );
+ }
+
$meta = $dx->evaluate('/html/head/meta[@name="robots" and @content]')
->item(0);
if ($meta) {
$meta = $dx->evaluate('/html/head/meta[@name="robots" and @content]')
->item(0);
if ($meta) {
@@
-54,7
+61,7
@@
class Html
}
}
}
}
}
}
- if ($href == '' || $href
{0}
== '#') {
+ if ($href == '' || $href
[0]
== '#') {
//link on this page
continue;
}
//link on this page
continue;
}