mirror of
https://github.com/torrentpier/torrentpier-lts.git
synced 2025-03-01 15:21:02 +03:00
1360 lines
37 KiB
PHP
1360 lines
37 KiB
PHP
<?php
|
|
/**
|
|
* Zend Framework (http://framework.zend.com/)
|
|
*
|
|
* @link http://github.com/zendframework/zf2 for the canonical source repository
|
|
* @copyright Copyright (c) 2005-2014 Zend Technologies USA Inc. (http://www.zend.com)
|
|
* @license http://framework.zend.com/license/new-bsd New BSD License
|
|
*/
|
|
|
|
namespace Zend\Uri;
|
|
|
|
use Zend\Escaper\Escaper;
|
|
use Zend\Validator;
|
|
|
|
/**
|
|
* Generic URI handler
|
|
*/
|
|
class Uri implements UriInterface
|
|
{
|
|
/**
|
|
* Character classes defined in RFC-3986
|
|
*/
|
|
const CHAR_UNRESERVED = 'a-zA-Z0-9_\-\.~';
|
|
const CHAR_GEN_DELIMS = ':\/\?#\[\]@';
|
|
const CHAR_SUB_DELIMS = '!\$&\'\(\)\*\+,;=';
|
|
const CHAR_RESERVED = ':\/\?#\[\]@!\$&\'\(\)\*\+,;=';
|
|
/**
|
|
* Not in the spec - those characters have special meaning in urlencoded query parameters
|
|
*/
|
|
const CHAR_QUERY_DELIMS = '!\$\'\(\)\*\,';
|
|
|
|
/**
|
|
* Host part types represented as binary masks
|
|
* The binary mask consists of 5 bits in the following order:
|
|
* <RegName> | <DNS> | <IPvFuture> | <IPv6> | <IPv4>
|
|
* Place 1 or 0 in the different positions for enable or disable the part.
|
|
* Finally use a hexadecimal representation.
|
|
*/
|
|
const HOST_IPV4 = 0x01; //00001
|
|
const HOST_IPV6 = 0x02; //00010
|
|
const HOST_IPVFUTURE = 0x04; //00100
|
|
const HOST_IPVANY = 0x07; //00111
|
|
const HOST_DNS = 0x08; //01000
|
|
const HOST_DNS_OR_IPV4 = 0x09; //01001
|
|
const HOST_DNS_OR_IPV6 = 0x0A; //01010
|
|
const HOST_DNS_OR_IPV4_OR_IPV6 = 0x0B; //01011
|
|
const HOST_DNS_OR_IPVANY = 0x0F; //01111
|
|
const HOST_REGNAME = 0x10; //10000
|
|
const HOST_DNS_OR_IPV4_OR_IPV6_OR_REGNAME = 0x13; //10011
|
|
const HOST_ALL = 0x1F; //11111
|
|
|
|
/**
|
|
* URI scheme
|
|
*
|
|
* @var string
|
|
*/
|
|
protected $scheme;
|
|
|
|
/**
|
|
* URI userInfo part (usually user:password in HTTP URLs)
|
|
*
|
|
* @var string
|
|
*/
|
|
protected $userInfo;
|
|
|
|
/**
|
|
* URI hostname
|
|
*
|
|
* @var string
|
|
*/
|
|
protected $host;
|
|
|
|
/**
|
|
* URI port
|
|
*
|
|
* @var int
|
|
*/
|
|
protected $port;
|
|
|
|
/**
|
|
* URI path
|
|
*
|
|
* @var string
|
|
*/
|
|
protected $path;
|
|
|
|
/**
|
|
* URI query string
|
|
*
|
|
* @var string
|
|
*/
|
|
protected $query;
|
|
|
|
/**
|
|
* URI fragment
|
|
*
|
|
* @var string
|
|
*/
|
|
protected $fragment;
|
|
|
|
/**
|
|
* Which host part types are valid for this URI?
|
|
*
|
|
* @var int
|
|
*/
|
|
protected $validHostTypes = self::HOST_ALL;
|
|
|
|
/**
|
|
* Array of valid schemes.
|
|
*
|
|
* Subclasses of this class that only accept specific schemes may set the
|
|
* list of accepted schemes here. If not empty, when setScheme() is called
|
|
* it will only accept the schemes listed here.
|
|
*
|
|
* @var array
|
|
*/
|
|
protected static $validSchemes = array();
|
|
|
|
/**
|
|
* List of default ports per scheme
|
|
*
|
|
* Inheriting URI classes may set this, and the normalization methods will
|
|
* automatically remove the port if it is equal to the default port for the
|
|
* current scheme
|
|
*
|
|
* @var array
|
|
*/
|
|
protected static $defaultPorts = array();
|
|
|
|
/**
|
|
* @var Escaper
|
|
*/
|
|
protected static $escaper;
|
|
|
|
/**
|
|
* Create a new URI object
|
|
*
|
|
* @param Uri|string|null $uri
|
|
* @throws Exception\InvalidArgumentException
|
|
*/
|
|
public function __construct($uri = null)
|
|
{
|
|
if (is_string($uri)) {
|
|
$this->parse($uri);
|
|
} elseif ($uri instanceof UriInterface) {
|
|
// Copy constructor
|
|
$this->setScheme($uri->getScheme());
|
|
$this->setUserInfo($uri->getUserInfo());
|
|
$this->setHost($uri->getHost());
|
|
$this->setPort($uri->getPort());
|
|
$this->setPath($uri->getPath());
|
|
$this->setQuery($uri->getQuery());
|
|
$this->setFragment($uri->getFragment());
|
|
} elseif ($uri !== null) {
|
|
throw new Exception\InvalidArgumentException(sprintf(
|
|
'Expecting a string or a URI object, received "%s"',
|
|
(is_object($uri) ? get_class($uri) : gettype($uri))
|
|
));
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Set Escaper instance
|
|
*
|
|
* @param Escaper $escaper
|
|
*/
|
|
public static function setEscaper(Escaper $escaper)
|
|
{
|
|
static::$escaper = $escaper;
|
|
}
|
|
|
|
/**
|
|
* Retrieve Escaper instance
|
|
*
|
|
* Lazy-loads one if none provided
|
|
*
|
|
* @return Escaper
|
|
*/
|
|
public static function getEscaper()
|
|
{
|
|
if (null === static::$escaper) {
|
|
static::setEscaper(new Escaper());
|
|
}
|
|
return static::$escaper;
|
|
}
|
|
|
|
/**
|
|
* Check if the URI is valid
|
|
*
|
|
* Note that a relative URI may still be valid
|
|
*
|
|
* @return bool
|
|
*/
|
|
public function isValid()
|
|
{
|
|
if ($this->host) {
|
|
if (strlen($this->path) > 0 && substr($this->path, 0, 1) != '/') {
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
if ($this->userInfo || $this->port) {
|
|
return false;
|
|
}
|
|
|
|
if ($this->path) {
|
|
// Check path-only (no host) URI
|
|
if (substr($this->path, 0, 2) == '//') {
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
if (! ($this->query || $this->fragment)) {
|
|
// No host, path, query or fragment - this is not a valid URI
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
/**
|
|
* Check if the URI is a valid relative URI
|
|
*
|
|
* @return bool
|
|
*/
|
|
public function isValidRelative()
|
|
{
|
|
if ($this->scheme || $this->host || $this->userInfo || $this->port) {
|
|
return false;
|
|
}
|
|
|
|
if ($this->path) {
|
|
// Check path-only (no host) URI
|
|
if (substr($this->path, 0, 2) == '//') {
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
if (! ($this->query || $this->fragment)) {
|
|
// No host, path, query or fragment - this is not a valid URI
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
/**
|
|
* Check if the URI is an absolute or relative URI
|
|
*
|
|
* @return bool
|
|
*/
|
|
public function isAbsolute()
|
|
{
|
|
return ($this->scheme !== null);
|
|
}
|
|
|
|
/**
|
|
* Reset URI parts
|
|
*/
|
|
protected function reset()
|
|
{
|
|
$this->setScheme(null);
|
|
$this->setPort(null);
|
|
$this->setUserInfo(null);
|
|
$this->setHost(null);
|
|
$this->setPath(null);
|
|
$this->setFragment(null);
|
|
$this->setQuery(null);
|
|
}
|
|
|
|
/**
|
|
* Parse a URI string
|
|
*
|
|
* @param string $uri
|
|
* @return Uri
|
|
*/
|
|
public function parse($uri)
|
|
{
|
|
$this->reset();
|
|
|
|
// Capture scheme
|
|
if (($scheme = self::parseScheme($uri)) !== null) {
|
|
$this->setScheme($scheme);
|
|
$uri = substr($uri, strlen($scheme) + 1);
|
|
}
|
|
|
|
// Capture authority part
|
|
if (preg_match('|^//([^/\?#]*)|', $uri, $match)) {
|
|
$authority = $match[1];
|
|
$uri = substr($uri, strlen($match[0]));
|
|
|
|
// Split authority into userInfo and host
|
|
if (strpos($authority, '@') !== false) {
|
|
// The userInfo can also contain '@' symbols; split $authority
|
|
// into segments, and set it to the last segment.
|
|
$segments = explode('@', $authority);
|
|
$authority = array_pop($segments);
|
|
$userInfo = implode('@', $segments);
|
|
unset($segments);
|
|
$this->setUserInfo($userInfo);
|
|
}
|
|
|
|
$nMatches = preg_match('/:[\d]{1,5}$/', $authority, $matches);
|
|
if ($nMatches === 1) {
|
|
$portLength = strlen($matches[0]);
|
|
$port = substr($matches[0], 1);
|
|
|
|
$this->setPort((int) $port);
|
|
$authority = substr($authority, 0, -$portLength);
|
|
}
|
|
|
|
$this->setHost($authority);
|
|
}
|
|
|
|
if (!$uri) {
|
|
return $this;
|
|
}
|
|
|
|
// Capture the path
|
|
if (preg_match('|^[^\?#]*|', $uri, $match)) {
|
|
$this->setPath($match[0]);
|
|
$uri = substr($uri, strlen($match[0]));
|
|
}
|
|
|
|
if (!$uri) {
|
|
return $this;
|
|
}
|
|
|
|
// Capture the query
|
|
if (preg_match('|^\?([^#]*)|', $uri, $match)) {
|
|
$this->setQuery($match[1]);
|
|
$uri = substr($uri, strlen($match[0]));
|
|
}
|
|
if (!$uri) {
|
|
return $this;
|
|
}
|
|
|
|
// All that's left is the fragment
|
|
if ($uri && substr($uri, 0, 1) == '#') {
|
|
$this->setFragment(substr($uri, 1));
|
|
}
|
|
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Compose the URI into a string
|
|
*
|
|
* @return string
|
|
* @throws Exception\InvalidUriException
|
|
*/
|
|
public function toString()
|
|
{
|
|
if (!$this->isValid()) {
|
|
if ($this->isAbsolute() || !$this->isValidRelative()) {
|
|
throw new Exception\InvalidUriException(
|
|
'URI is not valid and cannot be converted into a string'
|
|
);
|
|
}
|
|
}
|
|
|
|
$uri = '';
|
|
|
|
if ($this->scheme) {
|
|
$uri .= $this->scheme . ':';
|
|
}
|
|
|
|
if ($this->host !== null) {
|
|
$uri .= '//';
|
|
if ($this->userInfo) {
|
|
$uri .= $this->userInfo . '@';
|
|
}
|
|
$uri .= $this->host;
|
|
if ($this->port) {
|
|
$uri .= ':' . $this->port;
|
|
}
|
|
}
|
|
|
|
if ($this->path) {
|
|
$uri .= static::encodePath($this->path);
|
|
} elseif ($this->host && ($this->query || $this->fragment)) {
|
|
$uri .= '/';
|
|
}
|
|
|
|
if ($this->query) {
|
|
$uri .= "?" . static::encodeQueryFragment($this->query);
|
|
}
|
|
|
|
if ($this->fragment) {
|
|
$uri .= "#" . static::encodeQueryFragment($this->fragment);
|
|
}
|
|
|
|
return $uri;
|
|
}
|
|
|
|
/**
|
|
* Normalize the URI
|
|
*
|
|
* Normalizing a URI includes removing any redundant parent directory or
|
|
* current directory references from the path (e.g. foo/bar/../baz becomes
|
|
* foo/baz), normalizing the scheme case, decoding any over-encoded
|
|
* characters etc.
|
|
*
|
|
* Eventually, two normalized URLs pointing to the same resource should be
|
|
* equal even if they were originally represented by two different strings
|
|
*
|
|
* @return Uri
|
|
*/
|
|
public function normalize()
|
|
{
|
|
if ($this->scheme) {
|
|
$this->scheme = static::normalizeScheme($this->scheme);
|
|
}
|
|
|
|
if ($this->host) {
|
|
$this->host = static::normalizeHost($this->host);
|
|
}
|
|
|
|
if ($this->port) {
|
|
$this->port = static::normalizePort($this->port, $this->scheme);
|
|
}
|
|
|
|
if ($this->path) {
|
|
$this->path = static::normalizePath($this->path);
|
|
}
|
|
|
|
if ($this->query) {
|
|
$this->query = static::normalizeQuery($this->query);
|
|
}
|
|
|
|
if ($this->fragment) {
|
|
$this->fragment = static::normalizeFragment($this->fragment);
|
|
}
|
|
|
|
// If path is empty (and we have a host), path should be '/'
|
|
// Isn't this valid ONLY for HTTP-URI?
|
|
if ($this->host && empty($this->path)) {
|
|
$this->path = '/';
|
|
}
|
|
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Convert a relative URI into an absolute URI using a base absolute URI as
|
|
* a reference.
|
|
*
|
|
* This is similar to merge() - only it uses the supplied URI as the
|
|
* base reference instead of using the current URI as the base reference.
|
|
*
|
|
* Merging algorithm is adapted from RFC-3986 section 5.2
|
|
* (@link http://tools.ietf.org/html/rfc3986#section-5.2)
|
|
*
|
|
* @param Uri|string $baseUri
|
|
* @throws Exception\InvalidArgumentException
|
|
* @return Uri
|
|
*/
|
|
public function resolve($baseUri)
|
|
{
|
|
// Ignore if URI is absolute
|
|
if ($this->isAbsolute()) {
|
|
return $this;
|
|
}
|
|
|
|
if (is_string($baseUri)) {
|
|
$baseUri = new static($baseUri);
|
|
} elseif (!$baseUri instanceof Uri) {
|
|
throw new Exception\InvalidArgumentException(
|
|
'Provided base URI must be a string or a Uri object'
|
|
);
|
|
}
|
|
|
|
// Merging starts here...
|
|
if ($this->getHost()) {
|
|
$this->setPath(static::removePathDotSegments($this->getPath()));
|
|
} else {
|
|
$basePath = $baseUri->getPath();
|
|
$relPath = $this->getPath();
|
|
if (!$relPath) {
|
|
$this->setPath($basePath);
|
|
if (!$this->getQuery()) {
|
|
$this->setQuery($baseUri->getQuery());
|
|
}
|
|
} else {
|
|
if (substr($relPath, 0, 1) == '/') {
|
|
$this->setPath(static::removePathDotSegments($relPath));
|
|
} else {
|
|
if ($baseUri->getHost() && !$basePath) {
|
|
$mergedPath = '/';
|
|
} else {
|
|
$mergedPath = substr($basePath, 0, strrpos($basePath, '/') + 1);
|
|
}
|
|
$this->setPath(static::removePathDotSegments($mergedPath . $relPath));
|
|
}
|
|
}
|
|
|
|
// Set the authority part
|
|
$this->setUserInfo($baseUri->getUserInfo());
|
|
$this->setHost($baseUri->getHost());
|
|
$this->setPort($baseUri->getPort());
|
|
}
|
|
|
|
$this->setScheme($baseUri->getScheme());
|
|
return $this;
|
|
}
|
|
|
|
|
|
/**
|
|
* Convert the link to a relative link by substracting a base URI
|
|
*
|
|
* This is the opposite of resolving a relative link - i.e. creating a
|
|
* relative reference link from an original URI and a base URI.
|
|
*
|
|
* If the two URIs do not intersect (e.g. the original URI is not in any
|
|
* way related to the base URI) the URI will not be modified.
|
|
*
|
|
* @param Uri|string $baseUri
|
|
* @return Uri
|
|
*/
|
|
public function makeRelative($baseUri)
|
|
{
|
|
// Copy base URI, we should not modify it
|
|
$baseUri = new static($baseUri);
|
|
|
|
$this->normalize();
|
|
$baseUri->normalize();
|
|
|
|
$host = $this->getHost();
|
|
$baseHost = $baseUri->getHost();
|
|
if ($host && $baseHost && ($host != $baseHost)) {
|
|
// Not the same hostname
|
|
return $this;
|
|
}
|
|
|
|
$port = $this->getPort();
|
|
$basePort = $baseUri->getPort();
|
|
if ($port && $basePort && ($port != $basePort)) {
|
|
// Not the same port
|
|
return $this;
|
|
}
|
|
|
|
$scheme = $this->getScheme();
|
|
$baseScheme = $baseUri->getScheme();
|
|
if ($scheme && $baseScheme && ($scheme != $baseScheme)) {
|
|
// Not the same scheme (e.g. HTTP vs. HTTPS)
|
|
return $this;
|
|
}
|
|
|
|
// Remove host, port and scheme
|
|
$this->setHost(null)
|
|
->setPort(null)
|
|
->setScheme(null);
|
|
|
|
// Is path the same?
|
|
if ($this->getPath() == $baseUri->getPath()) {
|
|
$this->setPath('');
|
|
return $this;
|
|
}
|
|
|
|
$pathParts = preg_split('|(/)|', $this->getPath(), null,
|
|
PREG_SPLIT_DELIM_CAPTURE | PREG_SPLIT_NO_EMPTY);
|
|
$baseParts = preg_split('|(/)|', $baseUri->getPath(), null,
|
|
PREG_SPLIT_DELIM_CAPTURE | PREG_SPLIT_NO_EMPTY);
|
|
|
|
// Get the intersection of existing path parts and those from the
|
|
// provided URI
|
|
$matchingParts = array_intersect_assoc($pathParts, $baseParts);
|
|
|
|
// Loop through the matches
|
|
foreach ($matchingParts as $index => $segment) {
|
|
// If we skip an index at any point, we have parent traversal, and
|
|
// need to prepend the path accordingly
|
|
if ($index && !isset($matchingParts[$index - 1])) {
|
|
array_unshift($pathParts, '../');
|
|
continue;
|
|
}
|
|
|
|
// Otherwise, we simply unset the given path segment
|
|
unset($pathParts[$index]);
|
|
}
|
|
|
|
// Reset the path by imploding path segments
|
|
$this->setPath(implode($pathParts));
|
|
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Get the scheme part of the URI
|
|
*
|
|
* @return string|null
|
|
*/
|
|
public function getScheme()
|
|
{
|
|
return $this->scheme;
|
|
}
|
|
|
|
/**
|
|
* Get the User-info (usually user:password) part
|
|
*
|
|
* @return string|null
|
|
*/
|
|
public function getUserInfo()
|
|
{
|
|
return $this->userInfo;
|
|
}
|
|
|
|
/**
|
|
* Get the URI host
|
|
*
|
|
* @return string|null
|
|
*/
|
|
public function getHost()
|
|
{
|
|
return $this->host;
|
|
}
|
|
|
|
/**
|
|
* Get the URI port
|
|
*
|
|
* @return int|null
|
|
*/
|
|
public function getPort()
|
|
{
|
|
return $this->port;
|
|
}
|
|
|
|
/**
|
|
* Get the URI path
|
|
*
|
|
* @return string|null
|
|
*/
|
|
public function getPath()
|
|
{
|
|
return $this->path;
|
|
}
|
|
|
|
/**
|
|
* Get the URI query
|
|
*
|
|
* @return string|null
|
|
*/
|
|
public function getQuery()
|
|
{
|
|
return $this->query;
|
|
}
|
|
|
|
/**
|
|
* Return the query string as an associative array of key => value pairs
|
|
*
|
|
* This is an extension to RFC-3986 but is quite useful when working with
|
|
* most common URI types
|
|
*
|
|
* @return array
|
|
*/
|
|
public function getQueryAsArray()
|
|
{
|
|
$query = array();
|
|
if ($this->query) {
|
|
parse_str($this->query, $query);
|
|
}
|
|
|
|
return $query;
|
|
}
|
|
|
|
/**
|
|
* Get the URI fragment
|
|
*
|
|
* @return string|null
|
|
*/
|
|
public function getFragment()
|
|
{
|
|
return $this->fragment;
|
|
}
|
|
|
|
/**
|
|
* Set the URI scheme
|
|
*
|
|
* If the scheme is not valid according to the generic scheme syntax or
|
|
* is not acceptable by the specific URI class (e.g. 'http' or 'https' are
|
|
* the only acceptable schemes for the Zend\Uri\Http class) an exception
|
|
* will be thrown.
|
|
*
|
|
* You can check if a scheme is valid before setting it using the
|
|
* validateScheme() method.
|
|
*
|
|
* @param string $scheme
|
|
* @throws Exception\InvalidUriPartException
|
|
* @return Uri
|
|
*/
|
|
public function setScheme($scheme)
|
|
{
|
|
if (($scheme !== null) && (!self::validateScheme($scheme))) {
|
|
throw new Exception\InvalidUriPartException(sprintf(
|
|
'Scheme "%s" is not valid or is not accepted by %s',
|
|
$scheme,
|
|
get_class($this)
|
|
), Exception\InvalidUriPartException::INVALID_SCHEME);
|
|
}
|
|
|
|
$this->scheme = $scheme;
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Set the URI User-info part (usually user:password)
|
|
*
|
|
* @param string $userInfo
|
|
* @return Uri
|
|
* @throws Exception\InvalidUriPartException If the schema definition
|
|
* does not have this part
|
|
*/
|
|
public function setUserInfo($userInfo)
|
|
{
|
|
$this->userInfo = $userInfo;
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Set the URI host
|
|
*
|
|
* Note that the generic syntax for URIs allows using host names which
|
|
* are not necessarily IPv4 addresses or valid DNS host names. For example,
|
|
* IPv6 addresses are allowed as well, and also an abstract "registered name"
|
|
* which may be any name composed of a valid set of characters, including,
|
|
* for example, tilda (~) and underscore (_) which are not allowed in DNS
|
|
* names.
|
|
*
|
|
* Subclasses of Uri may impose more strict validation of host names - for
|
|
* example the HTTP RFC clearly states that only IPv4 and valid DNS names
|
|
* are allowed in HTTP URIs.
|
|
*
|
|
* @param string $host
|
|
* @throws Exception\InvalidUriPartException
|
|
* @return Uri
|
|
*/
|
|
public function setHost($host)
|
|
{
|
|
if (($host !== '')
|
|
&& ($host !== null)
|
|
&& !self::validateHost($host, $this->validHostTypes)
|
|
) {
|
|
throw new Exception\InvalidUriPartException(sprintf(
|
|
'Host "%s" is not valid or is not accepted by %s',
|
|
$host,
|
|
get_class($this)
|
|
), Exception\InvalidUriPartException::INVALID_HOSTNAME);
|
|
}
|
|
|
|
$this->host = $host;
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Set the port part of the URI
|
|
*
|
|
* @param int $port
|
|
* @return Uri
|
|
*/
|
|
public function setPort($port)
|
|
{
|
|
$this->port = $port;
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Set the path
|
|
*
|
|
* @param string $path
|
|
* @return Uri
|
|
*/
|
|
public function setPath($path)
|
|
{
|
|
$this->path = $path;
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Set the query string
|
|
*
|
|
* If an array is provided, will encode this array of parameters into a
|
|
* query string. Array values will be represented in the query string using
|
|
* PHP's common square bracket notation.
|
|
*
|
|
* @param string|array $query
|
|
* @return Uri
|
|
*/
|
|
public function setQuery($query)
|
|
{
|
|
if (is_array($query)) {
|
|
// We replace the + used for spaces by http_build_query with the
|
|
// more standard %20.
|
|
$query = str_replace('+', '%20', http_build_query($query));
|
|
}
|
|
|
|
$this->query = $query;
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Set the URI fragment part
|
|
*
|
|
* @param string $fragment
|
|
* @return Uri
|
|
* @throws Exception\InvalidUriPartException If the schema definition
|
|
* does not have this part
|
|
*/
|
|
public function setFragment($fragment)
|
|
{
|
|
$this->fragment = $fragment;
|
|
return $this;
|
|
}
|
|
|
|
/**
|
|
* Magic method to convert the URI to a string
|
|
*
|
|
* @return string
|
|
*/
|
|
public function __toString()
|
|
{
|
|
try {
|
|
return $this->toString();
|
|
} catch (\Exception $e) {
|
|
return '';
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Encoding and Validation Methods
|
|
*/
|
|
|
|
/**
|
|
* Check if a scheme is valid or not
|
|
*
|
|
* Will check $scheme to be valid against the generic scheme syntax defined
|
|
* in RFC-3986. If the class also defines specific acceptable schemes, will
|
|
* also check that $scheme is one of them.
|
|
*
|
|
* @param string $scheme
|
|
* @return bool
|
|
*/
|
|
public static function validateScheme($scheme)
|
|
{
|
|
if (!empty(static::$validSchemes)
|
|
&& !in_array(strtolower($scheme), static::$validSchemes)
|
|
) {
|
|
return false;
|
|
}
|
|
|
|
return (bool) preg_match('/^[A-Za-z][A-Za-z0-9\-\.+]*$/', $scheme);
|
|
}
|
|
|
|
/**
|
|
* Check that the userInfo part of a URI is valid
|
|
*
|
|
* @param string $userInfo
|
|
* @return bool
|
|
*/
|
|
public static function validateUserInfo($userInfo)
|
|
{
|
|
$regex = '/^(?:[' . self::CHAR_UNRESERVED . self::CHAR_SUB_DELIMS . ':]+|%[A-Fa-f0-9]{2})*$/';
|
|
return (bool) preg_match($regex, $userInfo);
|
|
}
|
|
|
|
/**
|
|
* Validate the host part
|
|
*
|
|
* Users may control which host types to allow by passing a second parameter
|
|
* with a bitmask of HOST_* constants which are allowed. If not specified,
|
|
* all address types will be allowed.
|
|
*
|
|
* Note that the generic URI syntax allows different host representations,
|
|
* including IPv4 addresses, IPv6 addresses and future IP address formats
|
|
* enclosed in square brackets, and registered names which may be DNS names
|
|
* or even more complex names. This is different (and is much more loose)
|
|
* from what is commonly accepted as valid HTTP URLs for example.
|
|
*
|
|
* @param string $host
|
|
* @param int $allowed bitmask of allowed host types
|
|
* @return bool
|
|
*/
|
|
public static function validateHost($host, $allowed = self::HOST_ALL)
|
|
{
|
|
/*
|
|
* "first-match-wins" algorithm (RFC 3986):
|
|
* If host matches the rule for IPv4address, then it should be
|
|
* considered an IPv4 address literal and not a reg-name
|
|
*/
|
|
if ($allowed & self::HOST_IPVANY) {
|
|
if (static::isValidIpAddress($host, $allowed)) {
|
|
return true;
|
|
}
|
|
}
|
|
|
|
if ($allowed & self::HOST_REGNAME) {
|
|
if (static::isValidRegName($host)) {
|
|
return true;
|
|
}
|
|
}
|
|
|
|
if ($allowed & self::HOST_DNS) {
|
|
if (static::isValidDnsHostname($host)) {
|
|
return true;
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
/**
|
|
* Validate the port
|
|
*
|
|
* Valid values include numbers between 1 and 65535, and empty values
|
|
*
|
|
* @param int $port
|
|
* @return bool
|
|
*/
|
|
public static function validatePort($port)
|
|
{
|
|
if ($port === 0) {
|
|
return false;
|
|
}
|
|
|
|
if ($port) {
|
|
$port = (int) $port;
|
|
if ($port < 1 || $port > 0xffff) {
|
|
return false;
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
/**
|
|
* Validate the path
|
|
*
|
|
* @param string $path
|
|
* @return bool
|
|
*/
|
|
public static function validatePath($path)
|
|
{
|
|
$pchar = '(?:[' . self::CHAR_UNRESERVED . ':@&=\+\$,]+|%[A-Fa-f0-9]{2})*';
|
|
$segment = $pchar . "(?:;{$pchar})*";
|
|
$regex = "/^{$segment}(?:\/{$segment})*$/";
|
|
return (bool) preg_match($regex, $path);
|
|
}
|
|
|
|
/**
|
|
* Check if a URI query or fragment part is valid or not
|
|
*
|
|
* Query and Fragment parts are both restricted by the same syntax rules,
|
|
* so the same validation method can be used for both.
|
|
*
|
|
* You can encode a query or fragment part to ensure it is valid by passing
|
|
* it through the encodeQueryFragment() method.
|
|
*
|
|
* @param string $input
|
|
* @return bool
|
|
*/
|
|
public static function validateQueryFragment($input)
|
|
{
|
|
$regex = '/^(?:[' . self::CHAR_UNRESERVED . self::CHAR_SUB_DELIMS . ':@\/\?]+|%[A-Fa-f0-9]{2})*$/';
|
|
return (bool) preg_match($regex, $input);
|
|
}
|
|
|
|
/**
|
|
* URL-encode the user info part of a URI
|
|
*
|
|
* @param string $userInfo
|
|
* @return string
|
|
* @throws Exception\InvalidArgumentException
|
|
*/
|
|
public static function encodeUserInfo($userInfo)
|
|
{
|
|
if (!is_string($userInfo)) {
|
|
throw new Exception\InvalidArgumentException(sprintf(
|
|
'Expecting a string, got %s',
|
|
(is_object($userInfo) ? get_class($userInfo) : gettype($userInfo))
|
|
));
|
|
}
|
|
|
|
$regex = '/(?:[^' . self::CHAR_UNRESERVED . self::CHAR_SUB_DELIMS . '%:]|%(?![A-Fa-f0-9]{2}))/';
|
|
$escaper = static::getEscaper();
|
|
$replace = function ($match) use ($escaper) {
|
|
return $escaper->escapeUrl($match[0]);
|
|
};
|
|
|
|
return preg_replace_callback($regex, $replace, $userInfo);
|
|
}
|
|
|
|
/**
|
|
* Encode the path
|
|
*
|
|
* Will replace all characters which are not strictly allowed in the path
|
|
* part with percent-encoded representation
|
|
*
|
|
* @param string $path
|
|
* @throws Exception\InvalidArgumentException
|
|
* @return string
|
|
*/
|
|
public static function encodePath($path)
|
|
{
|
|
if (!is_string($path)) {
|
|
throw new Exception\InvalidArgumentException(sprintf(
|
|
'Expecting a string, got %s',
|
|
(is_object($path) ? get_class($path) : gettype($path))
|
|
));
|
|
}
|
|
|
|
$regex = '/(?:[^' . self::CHAR_UNRESERVED . ':@&=\+\$,\/;%]+|%(?![A-Fa-f0-9]{2}))/';
|
|
$escaper = static::getEscaper();
|
|
$replace = function ($match) use ($escaper) {
|
|
return $escaper->escapeUrl($match[0]);
|
|
};
|
|
|
|
return preg_replace_callback($regex, $replace, $path);
|
|
}
|
|
|
|
/**
|
|
* URL-encode a query string or fragment based on RFC-3986 guidelines.
|
|
*
|
|
* Note that query and fragment encoding allows more unencoded characters
|
|
* than the usual rawurlencode() function would usually return - for example
|
|
* '/' and ':' are allowed as literals.
|
|
*
|
|
* @param string $input
|
|
* @return string
|
|
* @throws Exception\InvalidArgumentException
|
|
*/
|
|
public static function encodeQueryFragment($input)
|
|
{
|
|
if (!is_string($input)) {
|
|
throw new Exception\InvalidArgumentException(sprintf(
|
|
'Expecting a string, got %s',
|
|
(is_object($input) ? get_class($input) : gettype($input))
|
|
));
|
|
}
|
|
|
|
$regex = '/(?:[^' . self::CHAR_UNRESERVED . self::CHAR_SUB_DELIMS . '%:@\/\?]+|%(?![A-Fa-f0-9]{2}))/';
|
|
$escaper = static::getEscaper();
|
|
$replace = function ($match) use ($escaper) {
|
|
return $escaper->escapeUrl($match[0]);
|
|
};
|
|
|
|
return preg_replace_callback($regex, $replace, $input);
|
|
}
|
|
|
|
/**
|
|
* Extract only the scheme part out of a URI string.
|
|
*
|
|
* This is used by the parse() method, but is useful as a standalone public
|
|
* method if one wants to test a URI string for it's scheme before doing
|
|
* anything with it.
|
|
*
|
|
* Will return the scheme if found, or NULL if no scheme found (URI may
|
|
* still be valid, but not full)
|
|
*
|
|
* @param string $uriString
|
|
* @throws Exception\InvalidArgumentException
|
|
* @return string|null
|
|
*/
|
|
public static function parseScheme($uriString)
|
|
{
|
|
if (! is_string($uriString)) {
|
|
throw new Exception\InvalidArgumentException(sprintf(
|
|
'Expecting a string, got %s',
|
|
(is_object($uriString) ? get_class($uriString) : gettype($uriString))
|
|
));
|
|
}
|
|
|
|
if (preg_match('/^([A-Za-z][A-Za-z0-9\.\+\-]*):/', $uriString, $match)) {
|
|
return $match[1];
|
|
}
|
|
|
|
return null;
|
|
}
|
|
|
|
/**
|
|
* Remove any extra dot segments (/../, /./) from a path
|
|
*
|
|
* Algorithm is adapted from RFC-3986 section 5.2.4
|
|
* (@link http://tools.ietf.org/html/rfc3986#section-5.2.4)
|
|
*
|
|
* @todo consider optimizing
|
|
*
|
|
* @param string $path
|
|
* @return string
|
|
*/
|
|
public static function removePathDotSegments($path)
|
|
{
|
|
$output = '';
|
|
|
|
while ($path) {
|
|
if ($path == '..' || $path == '.') {
|
|
break;
|
|
}
|
|
|
|
switch (true) {
|
|
case ($path == '/.'):
|
|
$path = '/';
|
|
break;
|
|
case ($path == '/..'):
|
|
$path = '/';
|
|
$output = substr($output, 0, strrpos($output, '/', -1));
|
|
break;
|
|
case (substr($path, 0, 4) == '/../'):
|
|
$path = '/' . substr($path, 4);
|
|
$output = substr($output, 0, strrpos($output, '/', -1));
|
|
break;
|
|
case (substr($path, 0, 3) == '/./'):
|
|
$path = substr($path, 2);
|
|
break;
|
|
case (substr($path, 0, 2) == './'):
|
|
$path = substr($path, 2);
|
|
break;
|
|
case (substr($path, 0, 3) == '../'):
|
|
$path = substr($path, 3);
|
|
break;
|
|
default:
|
|
$slash = strpos($path, '/', 1);
|
|
if ($slash === false) {
|
|
$seg = $path;
|
|
} else {
|
|
$seg = substr($path, 0, $slash);
|
|
}
|
|
|
|
$output .= $seg;
|
|
$path = substr($path, strlen($seg));
|
|
break;
|
|
}
|
|
}
|
|
|
|
return $output;
|
|
}
|
|
|
|
/**
|
|
* Merge a base URI and a relative URI into a new URI object
|
|
*
|
|
* This convenience method wraps ::resolve() to allow users to quickly
|
|
* create new absolute URLs without the need to instantiate and clone
|
|
* URI objects.
|
|
*
|
|
* If objects are passed in, none of the passed objects will be modified.
|
|
*
|
|
* @param Uri|string $baseUri
|
|
* @param Uri|string $relativeUri
|
|
* @return Uri
|
|
*/
|
|
public static function merge($baseUri, $relativeUri)
|
|
{
|
|
$uri = new static($relativeUri);
|
|
return $uri->resolve($baseUri);
|
|
}
|
|
|
|
/**
|
|
* Check if a host name is a valid IP address, depending on allowed IP address types
|
|
*
|
|
* @param string $host
|
|
* @param int $allowed allowed address types
|
|
* @return bool
|
|
*/
|
|
protected static function isValidIpAddress($host, $allowed)
|
|
{
|
|
$validatorParams = array(
|
|
'allowipv4' => (bool) ($allowed & self::HOST_IPV4),
|
|
'allowipv6' => false,
|
|
'allowipvfuture' => false,
|
|
'allowliteral' => false,
|
|
);
|
|
|
|
// Test only IPv4
|
|
$validator = new Validator\Ip($validatorParams);
|
|
$return = $validator->isValid($host);
|
|
if ($return) {
|
|
return true;
|
|
}
|
|
|
|
// IPv6 & IPvLiteral must be in literal format
|
|
$validatorParams = array(
|
|
'allowipv4' => false,
|
|
'allowipv6' => (bool) ($allowed & self::HOST_IPV6),
|
|
'allowipvfuture' => (bool) ($allowed & self::HOST_IPVFUTURE),
|
|
'allowliteral' => true,
|
|
);
|
|
static $regex = '/^\[.*\]$/';
|
|
$validator->setOptions($validatorParams);
|
|
return (preg_match($regex, $host) && $validator->isValid($host));
|
|
}
|
|
|
|
/**
|
|
* Check if an address is a valid DNS hostname
|
|
*
|
|
* @param string $host
|
|
* @return bool
|
|
*/
|
|
protected static function isValidDnsHostname($host)
|
|
{
|
|
$validator = new Validator\Hostname(array(
|
|
'allow' => Validator\Hostname::ALLOW_DNS | Validator\Hostname::ALLOW_LOCAL,
|
|
));
|
|
|
|
return $validator->isValid($host);
|
|
}
|
|
|
|
/**
|
|
* Check if an address is a valid registered name (as defined by RFC-3986) address
|
|
*
|
|
* @param string $host
|
|
* @return bool
|
|
*/
|
|
protected static function isValidRegName($host)
|
|
{
|
|
$regex = '/^(?:[' . self::CHAR_UNRESERVED . self::CHAR_SUB_DELIMS . ':@\/\?]+|%[A-Fa-f0-9]{2})+$/';
|
|
return (bool) preg_match($regex, $host);
|
|
}
|
|
|
|
/**
|
|
* Part normalization methods
|
|
*
|
|
* These are called by normalize() using static::_normalize*() so they may
|
|
* be extended or overridden by extending classes to implement additional
|
|
* scheme specific normalization rules
|
|
*/
|
|
|
|
/**
|
|
* Normalize the scheme
|
|
*
|
|
* Usually this means simply converting the scheme to lower case
|
|
*
|
|
* @param string $scheme
|
|
* @return string
|
|
*/
|
|
protected static function normalizeScheme($scheme)
|
|
{
|
|
return strtolower($scheme);
|
|
}
|
|
|
|
/**
|
|
* Normalize the host part
|
|
*
|
|
* By default this converts host names to lower case
|
|
*
|
|
* @param string $host
|
|
* @return string
|
|
*/
|
|
protected static function normalizeHost($host)
|
|
{
|
|
return strtolower($host);
|
|
}
|
|
|
|
/**
|
|
* Normalize the port
|
|
*
|
|
* If the class defines a default port for the current scheme, and the
|
|
* current port is default, it will be unset.
|
|
*
|
|
* @param int $port
|
|
* @param string $scheme
|
|
* @return int|null
|
|
*/
|
|
protected static function normalizePort($port, $scheme = null)
|
|
{
|
|
if ($scheme
|
|
&& isset(static::$defaultPorts[$scheme])
|
|
&& ($port == static::$defaultPorts[$scheme])
|
|
) {
|
|
return null;
|
|
}
|
|
|
|
return $port;
|
|
}
|
|
|
|
/**
|
|
* Normalize the path
|
|
*
|
|
* This involves removing redundant dot segments, decoding any over-encoded
|
|
* characters and encoding everything that needs to be encoded and is not
|
|
*
|
|
* @param string $path
|
|
* @return string
|
|
*/
|
|
protected static function normalizePath($path)
|
|
{
|
|
$path = self::encodePath(
|
|
self::decodeUrlEncodedChars(
|
|
self::removePathDotSegments($path),
|
|
'/[' . self::CHAR_UNRESERVED . ':@&=\+\$,\/;%]/'
|
|
)
|
|
);
|
|
|
|
return $path;
|
|
}
|
|
|
|
/**
|
|
* Normalize the query part
|
|
*
|
|
* This involves decoding everything that doesn't need to be encoded, and
|
|
* encoding everything else
|
|
*
|
|
* @param string $query
|
|
* @return string
|
|
*/
|
|
protected static function normalizeQuery($query)
|
|
{
|
|
$query = self::encodeQueryFragment(
|
|
self::decodeUrlEncodedChars(
|
|
$query,
|
|
'/[' . self::CHAR_UNRESERVED . self::CHAR_QUERY_DELIMS . ':@\/\?]/'
|
|
)
|
|
);
|
|
|
|
return $query;
|
|
}
|
|
|
|
/**
|
|
* Normalize the fragment part
|
|
*
|
|
* Currently this is exactly the same as normalizeQuery().
|
|
*
|
|
* @param string $fragment
|
|
* @return string
|
|
*/
|
|
protected static function normalizeFragment($fragment)
|
|
{
|
|
$fragment = self::encodeQueryFragment(
|
|
self::decodeUrlEncodedChars(
|
|
$fragment,
|
|
'/[' . self::CHAR_UNRESERVED . self::CHAR_SUB_DELIMS . '%:@\/\?]/'
|
|
)
|
|
);
|
|
|
|
return $fragment;
|
|
}
|
|
|
|
/**
|
|
* Decode all percent encoded characters which are allowed to be represented literally
|
|
*
|
|
* Will not decode any characters which are not listed in the 'allowed' list
|
|
*
|
|
* @param string $input
|
|
* @param string $allowed Pattern of allowed characters
|
|
* @return mixed
|
|
*/
|
|
protected static function decodeUrlEncodedChars($input, $allowed = '')
|
|
{
|
|
$decodeCb = function ($match) use ($allowed) {
|
|
$char = rawurldecode($match[0]);
|
|
if (preg_match($allowed, $char)) {
|
|
return $char;
|
|
}
|
|
return strtoupper($match[0]);
|
|
};
|
|
|
|
return preg_replace_callback('/%[A-Fa-f0-9]{2}/', $decodeCb, $input);
|
|
}
|
|
}
|