499 lines
18 KiB
PHP
499 lines
18 KiB
PHP
<?php
|
|
/**
|
|
* Stores cookies and passes them between HTTP requests
|
|
*
|
|
* PHP version 5
|
|
*
|
|
* LICENSE:
|
|
*
|
|
* Copyright (c) 2008-2011, Alexey Borzov <avb@php.net>
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
*
|
|
* * Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* * Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* * The names of the authors may not be used to endorse or promote products
|
|
* derived from this software without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
|
|
* IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
|
|
* THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
|
|
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
|
|
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
|
* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*
|
|
* @category HTTP
|
|
* @package HTTP_Request2
|
|
* @author Alexey Borzov <avb@php.net>
|
|
* @license http://opensource.org/licenses/bsd-license.php New BSD License
|
|
* @version SVN: $Id: CookieJar.php 308629 2011-02-24 17:34:24Z avb $
|
|
* @link http://pear.php.net/package/HTTP_Request2
|
|
*/
|
|
|
|
/** Class representing a HTTP request message */
|
|
require_once 'HTTP/Request2.php';
|
|
|
|
/**
|
|
* Stores cookies and passes them between HTTP requests
|
|
*
|
|
* @category HTTP
|
|
* @package HTTP_Request2
|
|
* @author Alexey Borzov <avb@php.net>
|
|
* @version Release: @package_version@
|
|
*/
|
|
class HTTP_Request2_CookieJar implements Serializable
|
|
{
|
|
/**
|
|
* Array of stored cookies
|
|
*
|
|
* The array is indexed by domain, path and cookie name
|
|
* .example.com
|
|
* /
|
|
* some_cookie => cookie data
|
|
* /subdir
|
|
* other_cookie => cookie data
|
|
* .example.org
|
|
* ...
|
|
*
|
|
* @var array
|
|
*/
|
|
protected $cookies = array();
|
|
|
|
/**
|
|
* Whether session cookies should be serialized when serializing the jar
|
|
* @var bool
|
|
*/
|
|
protected $serializeSession = false;
|
|
|
|
/**
|
|
* Whether Public Suffix List should be used for domain matching
|
|
* @var bool
|
|
*/
|
|
protected $useList = true;
|
|
|
|
/**
|
|
* Array with Public Suffix List data
|
|
* @var array
|
|
* @link http://publicsuffix.org/
|
|
*/
|
|
protected static $psl = array();
|
|
|
|
/**
|
|
* Class constructor, sets various options
|
|
*
|
|
* @param bool Controls serializing session cookies, see {@link serializeSessionCookies()}
|
|
* @param bool Controls using Public Suffix List, see {@link usePublicSuffixList()}
|
|
*/
|
|
public function __construct($serializeSessionCookies = false, $usePublicSuffixList = true)
|
|
{
|
|
$this->serializeSessionCookies($serializeSessionCookies);
|
|
$this->usePublicSuffixList($usePublicSuffixList);
|
|
}
|
|
|
|
/**
|
|
* Returns current time formatted in ISO-8601 at UTC timezone
|
|
*
|
|
* @return string
|
|
*/
|
|
protected function now()
|
|
{
|
|
$dt = new DateTime();
|
|
$dt->setTimezone(new DateTimeZone('UTC'));
|
|
return $dt->format(DateTime::ISO8601);
|
|
}
|
|
|
|
/**
|
|
* Checks cookie array for correctness, possibly updating its 'domain', 'path' and 'expires' fields
|
|
*
|
|
* The checks are as follows:
|
|
* - cookie array should contain 'name' and 'value' fields;
|
|
* - name and value should not contain disallowed symbols;
|
|
* - 'expires' should be either empty parseable by DateTime;
|
|
* - 'domain' and 'path' should be either not empty or an URL where
|
|
* cookie was set should be provided.
|
|
* - if $setter is provided, then document at that URL should be allowed
|
|
* to set a cookie for that 'domain'. If $setter is not provided,
|
|
* then no domain checks will be made.
|
|
*
|
|
* 'expires' field will be converted to ISO8601 format from COOKIE format,
|
|
* 'domain' and 'path' will be set from setter URL if empty.
|
|
*
|
|
* @param array cookie data, as returned by {@link HTTP_Request2_Response::getCookies()}
|
|
* @param Net_URL2 URL of the document that sent Set-Cookie header
|
|
* @return array Updated cookie array
|
|
* @throws HTTP_Request2_LogicException
|
|
* @throws HTTP_Request2_MessageException
|
|
*/
|
|
protected function checkAndUpdateFields(array $cookie, Net_URL2 $setter = null)
|
|
{
|
|
if ($missing = array_diff(array('name', 'value'), array_keys($cookie))) {
|
|
throw new HTTP_Request2_LogicException(
|
|
"Cookie array should contain 'name' and 'value' fields",
|
|
HTTP_Request2_Exception::MISSING_VALUE
|
|
);
|
|
}
|
|
if (preg_match(HTTP_Request2::REGEXP_INVALID_COOKIE, $cookie['name'])) {
|
|
throw new HTTP_Request2_LogicException(
|
|
"Invalid cookie name: '{$cookie['name']}'",
|
|
HTTP_Request2_Exception::INVALID_ARGUMENT
|
|
);
|
|
}
|
|
if (preg_match(HTTP_Request2::REGEXP_INVALID_COOKIE, $cookie['value'])) {
|
|
throw new HTTP_Request2_LogicException(
|
|
"Invalid cookie value: '{$cookie['value']}'",
|
|
HTTP_Request2_Exception::INVALID_ARGUMENT
|
|
);
|
|
}
|
|
$cookie += array('domain' => '', 'path' => '', 'expires' => null, 'secure' => false);
|
|
|
|
// Need ISO-8601 date @ UTC timezone
|
|
if (!empty($cookie['expires'])
|
|
&& !preg_match('/^\\d{4}-\\d{2}-\\d{2}T\\d{2}:\\d{2}:\\d{2}\\+0000$/', $cookie['expires'])
|
|
) {
|
|
try {
|
|
$dt = new DateTime($cookie['expires']);
|
|
$dt->setTimezone(new DateTimeZone('UTC'));
|
|
$cookie['expires'] = $dt->format(DateTime::ISO8601);
|
|
} catch (Exception $e) {
|
|
throw new HTTP_Request2_LogicException($e->getMessage());
|
|
}
|
|
}
|
|
|
|
if (empty($cookie['domain']) || empty($cookie['path'])) {
|
|
if (!$setter) {
|
|
throw new HTTP_Request2_LogicException(
|
|
'Cookie misses domain and/or path component, cookie setter URL needed',
|
|
HTTP_Request2_Exception::MISSING_VALUE
|
|
);
|
|
}
|
|
if (empty($cookie['domain'])) {
|
|
if ($host = $setter->getHost()) {
|
|
$cookie['domain'] = $host;
|
|
} else {
|
|
throw new HTTP_Request2_LogicException(
|
|
'Setter URL does not contain host part, can\'t set cookie domain',
|
|
HTTP_Request2_Exception::MISSING_VALUE
|
|
);
|
|
}
|
|
}
|
|
if (empty($cookie['path'])) {
|
|
$path = $setter->getPath();
|
|
$cookie['path'] = empty($path)? '/': substr($path, 0, strrpos($path, '/') + 1);
|
|
}
|
|
}
|
|
|
|
if ($setter && !$this->domainMatch($setter->getHost(), $cookie['domain'])) {
|
|
throw new HTTP_Request2_MessageException(
|
|
"Domain " . $setter->getHost() . " cannot set cookies for "
|
|
. $cookie['domain']
|
|
);
|
|
}
|
|
|
|
return $cookie;
|
|
}
|
|
|
|
/**
|
|
* Stores a cookie in the jar
|
|
*
|
|
* @param array cookie data, as returned by {@link HTTP_Request2_Response::getCookies()}
|
|
* @param Net_URL2 URL of the document that sent Set-Cookie header
|
|
* @throws HTTP_Request2_Exception
|
|
*/
|
|
public function store(array $cookie, Net_URL2 $setter = null)
|
|
{
|
|
$cookie = $this->checkAndUpdateFields($cookie, $setter);
|
|
|
|
if (strlen($cookie['value'])
|
|
&& (is_null($cookie['expires']) || $cookie['expires'] > $this->now())
|
|
) {
|
|
if (!isset($this->cookies[$cookie['domain']])) {
|
|
$this->cookies[$cookie['domain']] = array();
|
|
}
|
|
if (!isset($this->cookies[$cookie['domain']][$cookie['path']])) {
|
|
$this->cookies[$cookie['domain']][$cookie['path']] = array();
|
|
}
|
|
$this->cookies[$cookie['domain']][$cookie['path']][$cookie['name']] = $cookie;
|
|
|
|
} elseif (isset($this->cookies[$cookie['domain']][$cookie['path']][$cookie['name']])) {
|
|
unset($this->cookies[$cookie['domain']][$cookie['path']][$cookie['name']]);
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Adds cookies set in HTTP response to the jar
|
|
*
|
|
* @param HTTP_Request2_Response response
|
|
* @param Net_URL2 original request URL, needed for setting
|
|
* default domain/path
|
|
*/
|
|
public function addCookiesFromResponse(HTTP_Request2_Response $response, Net_URL2 $setter)
|
|
{
|
|
foreach ($response->getCookies() as $cookie) {
|
|
$this->store($cookie, $setter);
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Returns all cookies matching a given request URL
|
|
*
|
|
* The following checks are made:
|
|
* - cookie domain should match request host
|
|
* - cookie path should be a prefix for request path
|
|
* - 'secure' cookies will only be sent for HTTPS requests
|
|
*
|
|
* @param Net_URL2
|
|
* @param bool Whether to return cookies as string for "Cookie: " header
|
|
* @return array
|
|
*/
|
|
public function getMatching(Net_URL2 $url, $asString = false)
|
|
{
|
|
$host = $url->getHost();
|
|
$path = $url->getPath();
|
|
$secure = 0 == strcasecmp($url->getScheme(), 'https');
|
|
|
|
$matched = $ret = array();
|
|
foreach (array_keys($this->cookies) as $domain) {
|
|
if ($this->domainMatch($host, $domain)) {
|
|
foreach (array_keys($this->cookies[$domain]) as $cPath) {
|
|
if (0 === strpos($path, $cPath)) {
|
|
foreach ($this->cookies[$domain][$cPath] as $name => $cookie) {
|
|
if (!$cookie['secure'] || $secure) {
|
|
$matched[$name][strlen($cookie['path'])] = $cookie;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
foreach ($matched as $cookies) {
|
|
krsort($cookies);
|
|
$ret = array_merge($ret, $cookies);
|
|
}
|
|
if (!$asString) {
|
|
return $ret;
|
|
} else {
|
|
$str = '';
|
|
foreach ($ret as $c) {
|
|
$str .= (empty($str)? '': '; ') . $c['name'] . '=' . $c['value'];
|
|
}
|
|
return $str;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Returns all cookies stored in a jar
|
|
*
|
|
* @return array
|
|
*/
|
|
public function getAll()
|
|
{
|
|
$cookies = array();
|
|
foreach (array_keys($this->cookies) as $domain) {
|
|
foreach (array_keys($this->cookies[$domain]) as $path) {
|
|
foreach ($this->cookies[$domain][$path] as $name => $cookie) {
|
|
$cookies[] = $cookie;
|
|
}
|
|
}
|
|
}
|
|
return $cookies;
|
|
}
|
|
|
|
/**
|
|
* Sets whether session cookies should be serialized when serializing the jar
|
|
*
|
|
* @param boolean
|
|
*/
|
|
public function serializeSessionCookies($serialize)
|
|
{
|
|
$this->serializeSession = (bool)$serialize;
|
|
}
|
|
|
|
/**
|
|
* Sets whether Public Suffix List should be used for restricting cookie-setting
|
|
*
|
|
* Without PSL {@link domainMatch()} will only prevent setting cookies for
|
|
* top-level domains like '.com' or '.org'. However, it will not prevent
|
|
* setting a cookie for '.co.uk' even though only third-level registrations
|
|
* are possible in .uk domain.
|
|
*
|
|
* With the List it is possible to find the highest level at which a domain
|
|
* may be registered for a particular top-level domain and consequently
|
|
* prevent cookies set for '.co.uk' or '.msk.ru'. The same list is used by
|
|
* Firefox, Chrome and Opera browsers to restrict cookie setting.
|
|
*
|
|
* Note that PSL is licensed differently to HTTP_Request2 package (refer to
|
|
* the license information in public-suffix-list.php), so you can disable
|
|
* its use if this is an issue for you.
|
|
*
|
|
* @param boolean
|
|
* @link http://publicsuffix.org/learn/
|
|
*/
|
|
public function usePublicSuffixList($useList)
|
|
{
|
|
$this->useList = (bool)$useList;
|
|
}
|
|
|
|
/**
|
|
* Returns string representation of object
|
|
*
|
|
* @return string
|
|
* @see Serializable::serialize()
|
|
*/
|
|
public function serialize()
|
|
{
|
|
$cookies = $this->getAll();
|
|
if (!$this->serializeSession) {
|
|
for ($i = count($cookies) - 1; $i >= 0; $i--) {
|
|
if (empty($cookies[$i]['expires'])) {
|
|
unset($cookies[$i]);
|
|
}
|
|
}
|
|
}
|
|
return serialize(array(
|
|
'cookies' => $cookies,
|
|
'serializeSession' => $this->serializeSession,
|
|
'useList' => $this->useList
|
|
));
|
|
}
|
|
|
|
/**
|
|
* Constructs the object from serialized string
|
|
*
|
|
* @param string string representation
|
|
* @see Serializable::unserialize()
|
|
*/
|
|
public function unserialize($serialized)
|
|
{
|
|
$data = unserialize($serialized);
|
|
$now = $this->now();
|
|
$this->serializeSessionCookies($data['serializeSession']);
|
|
$this->usePublicSuffixList($data['useList']);
|
|
foreach ($data['cookies'] as $cookie) {
|
|
if (!empty($cookie['expires']) && $cookie['expires'] <= $now) {
|
|
continue;
|
|
}
|
|
if (!isset($this->cookies[$cookie['domain']])) {
|
|
$this->cookies[$cookie['domain']] = array();
|
|
}
|
|
if (!isset($this->cookies[$cookie['domain']][$cookie['path']])) {
|
|
$this->cookies[$cookie['domain']][$cookie['path']] = array();
|
|
}
|
|
$this->cookies[$cookie['domain']][$cookie['path']][$cookie['name']] = $cookie;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Checks whether a cookie domain matches a request host.
|
|
*
|
|
* The method is used by {@link store()} to check for whether a document
|
|
* at given URL can set a cookie with a given domain attribute and by
|
|
* {@link getMatching()} to find cookies matching the request URL.
|
|
*
|
|
* @param string request host
|
|
* @param string cookie domain
|
|
* @return bool match success
|
|
*/
|
|
public function domainMatch($requestHost, $cookieDomain)
|
|
{
|
|
if ($requestHost == $cookieDomain) {
|
|
return true;
|
|
}
|
|
// IP address, we require exact match
|
|
if (preg_match('/^(?:\d{1,3}\.){3}\d{1,3}$/', $requestHost)) {
|
|
return false;
|
|
}
|
|
if ('.' != $cookieDomain[0]) {
|
|
$cookieDomain = '.' . $cookieDomain;
|
|
}
|
|
// prevents setting cookies for '.com' and similar domains
|
|
if (!$this->useList && substr_count($cookieDomain, '.') < 2
|
|
|| $this->useList && !self::getRegisteredDomain($cookieDomain)
|
|
) {
|
|
return false;
|
|
}
|
|
return substr('.' . $requestHost, -strlen($cookieDomain)) == $cookieDomain;
|
|
}
|
|
|
|
/**
|
|
* Removes subdomains to get the registered domain (the first after top-level)
|
|
*
|
|
* The method will check Public Suffix List to find out where top-level
|
|
* domain ends and registered domain starts. It will remove domain parts
|
|
* to the left of registered one.
|
|
*
|
|
* @param string domain name
|
|
* @return string|bool registered domain, will return false if $domain is
|
|
* either invalid or a TLD itself
|
|
*/
|
|
public static function getRegisteredDomain($domain)
|
|
{
|
|
$domainParts = explode('.', ltrim($domain, '.'));
|
|
|
|
// load the list if needed
|
|
if (empty(self::$psl)) {
|
|
$path = '@data_dir@' . DIRECTORY_SEPARATOR . 'HTTP_Request2';
|
|
if (0 === strpos($path, '@' . 'data_dir@')) {
|
|
$path = realpath(dirname(__FILE__) . DIRECTORY_SEPARATOR . '..'
|
|
. DIRECTORY_SEPARATOR . 'data');
|
|
}
|
|
self::$psl = include_once $path . DIRECTORY_SEPARATOR . 'public-suffix-list.php';
|
|
}
|
|
|
|
if (!($result = self::checkDomainsList($domainParts, self::$psl))) {
|
|
// known TLD, invalid domain name
|
|
return false;
|
|
}
|
|
|
|
// unknown TLD
|
|
if (!strpos($result, '.')) {
|
|
// fallback to checking that domain "has at least two dots"
|
|
if (2 > ($count = count($domainParts))) {
|
|
return false;
|
|
}
|
|
return $domainParts[$count - 2] . '.' . $domainParts[$count - 1];
|
|
}
|
|
return $result;
|
|
}
|
|
|
|
/**
|
|
* Recursive helper method for {@link getRegisteredDomain()}
|
|
*
|
|
* @param array remaining domain parts
|
|
* @param mixed node in {@link HTTP_Request2_CookieJar::$psl} to check
|
|
* @return string|null concatenated domain parts, null in case of error
|
|
*/
|
|
protected static function checkDomainsList(array $domainParts, $listNode)
|
|
{
|
|
$sub = array_pop($domainParts);
|
|
$result = null;
|
|
|
|
if (!is_array($listNode) || is_null($sub)
|
|
|| array_key_exists('!' . $sub, $listNode)
|
|
) {
|
|
return $sub;
|
|
|
|
} elseif (array_key_exists($sub, $listNode)) {
|
|
$result = self::checkDomainsList($domainParts, $listNode[$sub]);
|
|
|
|
} elseif (array_key_exists('*', $listNode)) {
|
|
$result = self::checkDomainsList($domainParts, $listNode['*']);
|
|
|
|
} else {
|
|
return $sub;
|
|
}
|
|
|
|
return (strlen($result) > 0) ? ($result . '.' . $sub) : null;
|
|
}
|
|
}
|
|
?>
|