url = trim($url);
}
public function parse()
{
if ($this->url == '') {
$this->error = 'Empty fork URL';
return false;
}
$arUrl = parse_url($this->url);
$scheme = isset($arUrl['scheme']) ? $arUrl['scheme'] : '';
if ($scheme == 'https' && isset($arUrl['host'])
&& $arUrl['host'] == 'gist.github.com'
) {
$this->arGitUrls[][] = 'git://gist.github.com/'
. ltrim($arUrl['path'], '/') . '.git';
return true;
}
switch ($scheme) {
case 'git':
//clearly a git url
$this->arGitUrls = array(array($this->url));
return true;
case 'ssh':
//FIXME: maybe loosen this when we know how to skip the
//"do you trust this server" question of ssh
$this->error = 'ssh:// URLs are not supported';
return false;
case 'http':
case 'https':
return $this->extractUrlsFromHtml($this->url);
}
$this->error = 'Unknown URLs scheme: ' . $scheme;
return false;
}
protected function extractUrlsFromHtml($url)
{
//HTML is not necessarily well-formed, and Gitorious has many problems
// in this regard
//$sx = simplexml_load_file($url);
libxml_use_internal_errors(true);
$sx = simplexml_import_dom(\DomDocument::loadHtmlFile($url));
$elems = $sx->xpath('//*[@rel="vcs-git"]');
$count = $anonymous = 0;
foreach ($elems as $elem) {
if (!isset($elem['href'])) {
continue;
}
$str = (string)$elem;
if (isset($elem['title'])) {
//
$title = (string)$elem['title'];
} else if ($str != '') {
//title
$title = $str;
} else {
$title = 'Unnamed repository #' . ++$anonymous;
}
$url = (string)$elem['href'];
if ($this->isSupported($url)) {
++$count;
$this->arGitUrls[$title][] = $url;
}
}
if ($count > 0) {
return true;
}
$this->error = 'No git:// clone URL found';
return false;
}
/**
* Iterate through all git urls and return one if there is only
* one supported one.
*
* @return mixed Boolean false or string
*/
public function getUniqueGitUrl()
{
$nFound = 0;
foreach ($this->arGitUrls as $title => $arUrls) {
foreach ($arUrls as $url) {
$nFound++;
$uniqueUrl = $url;
}
}
if ($nFound == 1) {
return $uniqueUrl;
}
return false;
}
public function getGitUrls()
{
return $this->arGitUrls;
}
/**
* Get the URL from which the git URL was derived, often
* the HTTP URL.
*
* @return string
*/
public function getUrl()
{
return $this->url;
}
public function setUrl($url)
{
$this->url = $url;
}
public function isSupported($url)
{
return parse_url($url, PHP_URL_SCHEME) == 'git';
}
}
?>