123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136 |
- <?php
- /*
- * This file is part of the Symfony package.
- *
- * (c) Fabien Potencier <fabien@symfony.com>
- *
- * For the full copyright and license information, please view the LICENSE
- * file that was distributed with this source code.
- */
- namespace Symfony\Component\DomCrawler;
- /**
- * The UriResolver class takes an URI (relative, absolute, fragment, etc.)
- * and turns it into an absolute URI against another given base URI.
- *
- * @author Fabien Potencier <fabien@symfony.com>
- * @author Grégoire Pineau <lyrixx@lyrixx.info>
- */
- class UriResolver
- {
- /**
- * Resolves a URI according to a base URI.
- *
- * For example if $uri=/foo/bar and $baseUri=https://symfony.com it will
- * return https://symfony.com/foo/bar
- *
- * If the $uri is not absolute you must pass an absolute $baseUri
- */
- public static function resolve(string $uri, ?string $baseUri): string
- {
- $uri = trim($uri);
- // absolute URL?
- if (null !== parse_url($uri, \PHP_URL_SCHEME)) {
- return $uri;
- }
- if (null === $baseUri) {
- throw new \InvalidArgumentException('The URI is relative, so you must define its base URI passing an absolute URL.');
- }
- // empty URI
- if (!$uri) {
- return $baseUri;
- }
- // an anchor
- if ('#' === $uri[0]) {
- return self::cleanupAnchor($baseUri).$uri;
- }
- $baseUriCleaned = self::cleanupUri($baseUri);
- if ('?' === $uri[0]) {
- return $baseUriCleaned.$uri;
- }
- // absolute URL with relative schema
- if (0 === strpos($uri, '//')) {
- return preg_replace('#^([^/]*)//.*$#', '$1', $baseUriCleaned).$uri;
- }
- $baseUriCleaned = preg_replace('#^(.*?//[^/]*)(?:\/.*)?$#', '$1', $baseUriCleaned);
- // absolute path
- if ('/' === $uri[0]) {
- return $baseUriCleaned.$uri;
- }
- // relative path
- $path = parse_url(substr($baseUri, \strlen($baseUriCleaned)), \PHP_URL_PATH);
- $path = self::canonicalizePath(substr($path, 0, strrpos($path, '/')).'/'.$uri);
- return $baseUriCleaned.('' === $path || '/' !== $path[0] ? '/' : '').$path;
- }
- /**
- * Returns the canonicalized URI path (see RFC 3986, section 5.2.4).
- */
- private static function canonicalizePath(string $path): string
- {
- if ('' === $path || '/' === $path) {
- return $path;
- }
- if ('.' === substr($path, -1)) {
- $path .= '/';
- }
- $output = [];
- foreach (explode('/', $path) as $segment) {
- if ('..' === $segment) {
- array_pop($output);
- } elseif ('.' !== $segment) {
- $output[] = $segment;
- }
- }
- return implode('/', $output);
- }
- /**
- * Removes the query string and the anchor from the given uri.
- */
- private static function cleanupUri(string $uri): string
- {
- return self::cleanupQuery(self::cleanupAnchor($uri));
- }
- /**
- * Removes the query string from the uri.
- */
- private static function cleanupQuery(string $uri): string
- {
- if (false !== $pos = strpos($uri, '?')) {
- return substr($uri, 0, $pos);
- }
- return $uri;
- }
- /**
- * Removes the anchor from the uri.
- */
- private static function cleanupAnchor(string $uri): string
- {
- if (false !== $pos = strpos($uri, '#')) {
- return substr($uri, 0, $pos);
- }
- return $uri;
- }
- }
|