<?php

/*
 * This file is part of the Symfony package.
 *
 * (c) Fabien Potencier <fabien@symfony.com>
 *
 * For the full copyright and license information, please view the LICENSE
 * file that was distributed with this source code.
 */

namespace Symfony\Component\DomCrawler;

/**
 * Link represents an HTML link (an HTML a, area or link tag).
 *
 * The link wraps the DOM node carrying the "href" attribute and resolves that
 * attribute against the URI of the document the node was found in.
 *
 * @author Fabien Potencier <fabien@symfony.com>
 */
class Link
{
    /**
     * @var \DOMElement
     */
    protected $node;

    /**
     * @var string|null The upper-cased method to use for the link, or null when an empty method was given
     */
    protected $method;

    /**
     * @var string The URI of the page where the link is embedded (or the base href)
     */
    protected $currentUri;

    /**
     * @param \DOMElement $node       A \DOMElement instance
     * @param string      $currentUri The URI of the page where the link is embedded (or the base href)
     * @param string      $method     The method to use for the link (get by default)
     *
     * @throws \InvalidArgumentException if the current URI does not start with "http" or "file"
     * @throws \LogicException           if the node is not an a, area or link tag (raised by setNode())
     */
    public function __construct(\DOMElement $node, $currentUri, $method = 'GET')
    {
        // Only the first four characters are inspected, case-insensitively.
        $prefix = strtolower(substr($currentUri, 0, 4));
        if (!\in_array($prefix, ['http', 'file'], true)) {
            throw new \InvalidArgumentException(sprintf('Current URI must be an absolute URL ("%s").', $currentUri));
        }

        $this->setNode($node);
        $this->method = $method ? strtoupper($method) : null;
        $this->currentUri = $currentUri;
    }

    /**
     * Gets the node associated with this link.
     *
     * @return \DOMElement A \DOMElement instance
     */
    public function getNode()
    {
        return $this->node;
    }

    /**
     * Gets the method associated with this link.
     *
     * @return string|null The upper-cased method, or null when an empty method was passed to the constructor
     */
    public function getMethod()
    {
        return $this->method;
    }

    /**
     * Gets the URI associated with this link.
     *
     * The raw URI is trimmed and then resolved against the current URI:
     * a URI with a scheme is returned untouched, an empty URI yields the
     * current URI, and anchors, query strings, scheme-relative URIs,
     * absolute paths and relative paths are each merged with the relevant
     * part of the current URI.
     *
     * @return string The URI
     */
    public function getUri()
    {
        $uri = trim($this->getRawUri());

        // absolute URL?
        if (null !== parse_url($uri, PHP_URL_SCHEME)) {
            return $uri;
        }

        // empty URI; compared against '' explicitly because "0" is a valid
        // relative reference and must not be mistaken for an empty one
        if ('' === $uri) {
            return $this->currentUri;
        }

        // an anchor: keep the current query string, replace only the fragment
        if ('#' === $uri[0]) {
            return $this->cleanupAnchor($this->currentUri).$uri;
        }

        $baseUri = $this->cleanupUri($this->currentUri);

        // a query string: keep the current path, replace query and fragment
        if ('?' === $uri[0]) {
            return $baseUri.$uri;
        }

        // absolute URL with relative schema: reuse only the "scheme:" part
        if (0 === strpos($uri, '//')) {
            return preg_replace('#^([^/]*)//.*$#', '$1', $baseUri).$uri;
        }

        // reduce the base to "scheme://authority"
        $baseUri = preg_replace('#^(.*?//[^/]*)(?:\/.*)?$#', '$1', $baseUri);

        // absolute path
        if ('/' === $uri[0]) {
            return $baseUri.$uri;
        }

        // relative path: resolve against the directory of the current document.
        // parse_url() gives null when the current URI has no path component
        // (e.g. "http://host?query"), hence the cast before the string functions.
        $path = (string) parse_url(substr($this->currentUri, \strlen($baseUri)), PHP_URL_PATH);
        $lastSlash = strrpos($path, '/');
        $directory = false === $lastSlash ? '' : substr($path, 0, $lastSlash);
        $path = $this->canonicalizePath($directory.'/'.$uri);

        return $baseUri.('' === $path || '/' !== $path[0] ? '/' : '').$path;
    }

    /**
     * Returns raw URI data.
     *
     * Reads the "href" attribute of the wrapped node.
     *
     * @return string
     */
    protected function getRawUri()
    {
        return $this->node->getAttribute('href');
    }

    /**
     * Returns the canonicalized URI path (see RFC 3986, section 5.2.4).
     *
     * "." segments are dropped and each ".." segment removes the segment
     * collected before it. The empty path and "/" are returned unchanged.
     *
     * @param string $path URI path
     *
     * @return string
     */
    protected function canonicalizePath($path)
    {
        if ('' === $path || '/' === $path) {
            return $path;
        }

        // A path ending in a dot gets a trailing slash appended, so the
        // joined result of a trailing "." or ".." segment ends with "/".
        if ('.' === substr($path, -1)) {
            $path .= '/';
        }

        $output = [];

        foreach (explode('/', $path) as $segment) {
            if ('..' === $segment) {
                array_pop($output);
            } elseif ('.' !== $segment) {
                $output[] = $segment;
            }
        }

        return implode('/', $output);
    }

    /**
     * Sets current \DOMElement instance.
     *
     * @param \DOMElement $node A \DOMElement instance
     *
     * @throws \LogicException If given node is not an a, area or link tag
     */
    protected function setNode(\DOMElement $node)
    {
        if ('a' !== $node->nodeName && 'area' !== $node->nodeName && 'link' !== $node->nodeName) {
            throw new \LogicException(sprintf('Unable to navigate from a "%s" tag.', $node->nodeName));
        }

        $this->node = $node;
    }

    /**
     * Removes the query string and the anchor from the given uri.
     *
     * @param string $uri The uri to clean
     *
     * @return string
     */
    private function cleanupUri($uri)
    {
        return $this->cleanupQuery($this->cleanupAnchor($uri));
    }

    /**
     * Removes the query string (everything from the first "?") from the uri.
     *
     * @param string $uri
     *
     * @return string
     */
    private function cleanupQuery($uri)
    {
        if (false !== $pos = strpos($uri, '?')) {
            return substr($uri, 0, $pos);
        }

        return $uri;
    }

    /**
     * Removes the anchor (everything from the first "#") from the uri.
     *
     * @param string $uri
     *
     * @return string
     */
    private function cleanupAnchor($uri)
    {
        if (false !== $pos = strpos($uri, '#')) {
            return substr($uri, 0, $pos);
        }

        return $uri;
    }
}