You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
212 lines
5.2 KiB
212 lines
5.2 KiB
<?php |
|
|
|
/* |
|
* This file is part of the Symfony package. |
|
* |
|
* (c) Fabien Potencier <fabien@symfony.com> |
|
* |
|
* For the full copyright and license information, please view the LICENSE |
|
* file that was distributed with this source code. |
|
*/ |
|
|
|
namespace Symfony\Component\DomCrawler; |
|
|
|
/** |
|
* Any HTML element that can link to an URI. |
|
* |
|
* @author Fabien Potencier <fabien@symfony.com> |
|
*/ |
|
abstract class AbstractUriElement |
|
{ |
|
/** |
|
* @var \DOMElement |
|
*/ |
|
protected $node; |
|
|
|
/** |
|
* @var string The method to use for the element |
|
*/ |
|
protected $method; |
|
|
|
/** |
|
* @var string The URI of the page where the element is embedded (or the base href) |
|
*/ |
|
protected $currentUri; |
|
|
|
/** |
|
* @param \DOMElement $node A \DOMElement instance |
|
* @param string $currentUri The URI of the page where the link is embedded (or the base href) |
|
* @param string $method The method to use for the link (get by default) |
|
* |
|
* @throws \InvalidArgumentException if the node is not a link |
|
*/ |
|
public function __construct(\DOMElement $node, $currentUri, $method = 'GET') |
|
{ |
|
if (!in_array(strtolower(substr($currentUri, 0, 4)), array('http', 'file'))) { |
|
throw new \InvalidArgumentException(sprintf('Current URI must be an absolute URL ("%s").', $currentUri)); |
|
} |
|
|
|
$this->setNode($node); |
|
$this->method = $method ? strtoupper($method) : null; |
|
$this->currentUri = $currentUri; |
|
} |
|
|
|
/** |
|
* Gets the node associated with this link. |
|
* |
|
* @return \DOMElement A \DOMElement instance |
|
*/ |
|
public function getNode() |
|
{ |
|
return $this->node; |
|
} |
|
|
|
/** |
|
* Gets the method associated with this link. |
|
* |
|
* @return string The method |
|
*/ |
|
public function getMethod() |
|
{ |
|
return $this->method; |
|
} |
|
|
|
/** |
|
* Gets the URI associated with this link. |
|
* |
|
* @return string The URI |
|
*/ |
|
public function getUri() |
|
{ |
|
$uri = trim($this->getRawUri()); |
|
|
|
// absolute URL? |
|
if (null !== parse_url($uri, PHP_URL_SCHEME)) { |
|
return $uri; |
|
} |
|
|
|
// empty URI |
|
if (!$uri) { |
|
return $this->currentUri; |
|
} |
|
|
|
// an anchor |
|
if ('#' === $uri[0]) { |
|
return $this->cleanupAnchor($this->currentUri).$uri; |
|
} |
|
|
|
$baseUri = $this->cleanupUri($this->currentUri); |
|
|
|
if ('?' === $uri[0]) { |
|
return $baseUri.$uri; |
|
} |
|
|
|
// absolute URL with relative schema |
|
if (0 === strpos($uri, '//')) { |
|
return preg_replace('#^([^/]*)//.*$#', '$1', $baseUri).$uri; |
|
} |
|
|
|
$baseUri = preg_replace('#^(.*?//[^/]*)(?:\/.*)?$#', '$1', $baseUri); |
|
|
|
// absolute path |
|
if ('/' === $uri[0]) { |
|
return $baseUri.$uri; |
|
} |
|
|
|
// relative path |
|
$path = parse_url(substr($this->currentUri, strlen($baseUri)), PHP_URL_PATH); |
|
$path = $this->canonicalizePath(substr($path, 0, strrpos($path, '/')).'/'.$uri); |
|
|
|
return $baseUri.('' === $path || '/' !== $path[0] ? '/' : '').$path; |
|
} |
|
|
|
/** |
|
* Returns raw URI data. |
|
* |
|
* @return string |
|
*/ |
|
abstract protected function getRawUri(); |
|
|
|
/** |
|
* Returns the canonicalized URI path (see RFC 3986, section 5.2.4). |
|
* |
|
* @param string $path URI path |
|
* |
|
* @return string |
|
*/ |
|
protected function canonicalizePath($path) |
|
{ |
|
if ('' === $path || '/' === $path) { |
|
return $path; |
|
} |
|
|
|
if ('.' === substr($path, -1)) { |
|
$path .= '/'; |
|
} |
|
|
|
$output = array(); |
|
|
|
foreach (explode('/', $path) as $segment) { |
|
if ('..' === $segment) { |
|
array_pop($output); |
|
} elseif ('.' !== $segment) { |
|
$output[] = $segment; |
|
} |
|
} |
|
|
|
return implode('/', $output); |
|
} |
|
|
|
/** |
|
* Sets current \DOMElement instance. |
|
* |
|
* @param \DOMElement $node A \DOMElement instance |
|
* |
|
* @throws \LogicException If given node is not an anchor |
|
*/ |
|
abstract protected function setNode(\DOMElement $node); |
|
|
|
/** |
|
* Removes the query string and the anchor from the given uri. |
|
* |
|
* @param string $uri The uri to clean |
|
* |
|
* @return string |
|
*/ |
|
private function cleanupUri($uri) |
|
{ |
|
return $this->cleanupQuery($this->cleanupAnchor($uri)); |
|
} |
|
|
|
/** |
|
* Remove the query string from the uri. |
|
* |
|
* @param string $uri |
|
* |
|
* @return string |
|
*/ |
|
private function cleanupQuery($uri) |
|
{ |
|
if (false !== $pos = strpos($uri, '?')) { |
|
return substr($uri, 0, $pos); |
|
} |
|
|
|
return $uri; |
|
} |
|
|
|
/** |
|
* Remove the anchor from the uri. |
|
* |
|
* @param string $uri |
|
* |
|
* @return string |
|
*/ |
|
private function cleanupAnchor($uri) |
|
{ |
|
if (false !== $pos = strpos($uri, '#')) { |
|
return substr($uri, 0, $pos); |
|
} |
|
|
|
return $uri; |
|
} |
|
}
|
|
|