blob: 37c134553140f2cb152b9269ad72aa134e9d1a8b [file] [log] [blame]
<?php
/*
* SimpleID
*
* Copyright (C) Kelvin Mo 2007-9
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public
* License as published by the Free Software Foundation; either
* version 2 of the License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* General Public License for more details.
*
* You should have received a copy of the GNU General Public
* License along with this program; if not, write to the Free
* Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
*
* $Id$
*/
/**
* Functions for making and processing HTTP requests.
*
* @package simpleid
* @since 0.7
* @filesource
*/
/**
* The user agent to use during HTTP requests.
*/
define('SIMPLEHTTP_USER_AGENT', 'SimpleHTTP/' . substr('$Rev$', 6, -2));
/**
* Performs an HTTP request.
*
* Communication with the web server is conducted using libcurl where possible.
* Where libcurl does not exist, then sockets will be used.
*
* Note that the request must be properly prepared before passing onto this function.
* For example, for POST requests, the Content-Type and Content-Length headers must be
* included in $headers.
*
* @param string $url the URL
* @param array $headers HTTP headers containing name => value pairs
* @param string $body the request body
* @param string $method the HTTP request method
* @param int $retry the maximum number of redirects allowed
* @return array containing keys 'error-code' (for communication errors), 'error'
* (for communication errors), 'data' (content returned), 'code' (the HTTP status code), 'http-error'
* (if the HTTP status code is not 200 or 304), 'protocol' (the HTTP protocol in the response),
* 'headers' (an array of return headers in lowercase),
* 'content-type' (the HTTP content-type returned)
*/
function http_make_request($url, $headers = array(), $body = NULL, $method = 'GET', $retry = 3) {
// If CURL is available, we use it
if (extension_loaded('curl')) {
$response = _http_make_request_curl($url, $headers, $body, $method, $retry);
} else {
$response = _http_make_request_fsock($url, $headers, $body, $method, $retry);
}
if (!isset($response['error-code'])) {
$valid_codes = array(
100, 101,
200, 201, 202, 203, 204, 205, 206,
300, 301, 302, 303, 304, 305, 307,
400, 401, 402, 403, 404, 405, 406, 407, 408, 409, 410, 411, 412, 413, 414, 415, 416, 417,
500, 501, 502, 503, 504, 505
);
// RFC 2616 states that all unknown HTTP codes must be treated the same as the
// base code in their class.
if (!in_array($response['code'], $valid_codes)) {
$response['code'] = floor($response['code'] / 100) * 100;
}
if (($response['code'] != 200) && ($response['code'] != 304)) {
$response['http-error'] = $response['code'];
}
}
return $response;
}
/**
* Returns the protocols currently supported for making remote requests.
*
* If libcurl is used, this function returns a list of protocols supported by the
* included build of the library. If libcurl is not used, then HTTP is the
* only protocol supported.
*
* @return array an array of protocols
*/
function http_protocols() {
if (extension_loaded('curl')) {
$curl_version = curl_version();
return $curl_version['protocols'];
} else {
return array('http');
}
}
/**
* Performs an HTTP request using libcurl.
*
* @param string $url the URL
* @param array $headers HTTP headers containing name => value pairs
* @param string $body the request body
* @param string $method the HTTP request method
* @param int $retry the maximum number of redirects allowed
* @return array containing keys 'error-code' (for communication errors), 'error'
* (for communication errors), 'data' (content returned), 'code' (the HTTP status code), 'http-error'
* (if the HTTP status code is not 200 or 304), 'headers' (an array of return headers),
* 'content-type' (the HTTP content-type returned)
*/
function _http_make_request_curl($url, $headers = array(), $body = NULL, $method = 'GET', $retry = 3) {
// CURLOPT_FOLLOWLOCATION only works when safe mode is off or when open_basedir is set
// In these instances we will need to follow redirects manually
$manual_redirect = ((@ini_get('safe_mode') === 1) // safe mode
|| (strtolower(@ini_get('safe_mode')) == 'on') // safe mode
|| (@ini_get('open_basedir') != false)); // open_basedir
$version = curl_version();
$curl = curl_init($url);
if (version_compare($version['version'], '7.10.5', '>=')) {
curl_setopt($curl, CURLOPT_ENCODING, '');
}
if (!$manual_redirect) curl_setopt($curl, CURLOPT_FOLLOWLOCATION, true);
curl_setopt($curl, CURLOPT_CUSTOMREQUEST, $method);
curl_setopt($curl, CURLOPT_MAXREDIRS, $retry);
curl_setopt($curl, CURLOPT_HTTPHEADER, array(implode("\n", $headers) . "\n"));
curl_setopt($curl, CURLOPT_USERAGENT, SIMPLEHTTP_USER_AGENT);
curl_setopt($curl, CURLOPT_TIMEOUT, 20);
curl_setopt($curl, CURLOPT_CONNECTTIMEOUT, 20);
curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
curl_setopt($curl, CURLOPT_HEADER, true);
curl_setopt($curl, CURLOPT_SSL_VERIFYPEER, false);
curl_setopt($curl, CURLOPT_SSL_VERIFYHOST, false);
if ($body != NULL) curl_setopt($curl, CURLOPT_POSTFIELDS, $body);
$response = curl_exec($curl);
if (($response === FALSE) && ((curl_errno($curl) == 23) || (curl_errno($curl) == 61))) {
curl_setopt($curl, CURLOPT_ENCODING, 'none');
$response = curl_exec($curl);
}
if ($response === FALSE) {
$result = array();
$result['error-code'] = curl_errno($curl);
$result['error'] = curl_error($curl);
} else {
$result['code'] = curl_getinfo($curl, CURLINFO_HTTP_CODE);
$result['url'] = curl_getinfo($curl, CURLINFO_EFFECTIVE_URL);
$result['content-type'] = curl_getinfo($curl, CURLINFO_CONTENT_TYPE);
// Parse response.
$result['raw'] = $response;
$header_size = curl_getinfo($curl, CURLINFO_HEADER_SIZE);
$result['data'] = substr($response, $header_size);
$response_headers = substr($response, 0, $header_size - 4);
// In case where redirect occurs, we want the last set of headers
$header_blocks = explode("\r\n\r\n", $response_headers);
$header_block = array_pop($header_blocks);
$result = array_merge($result, _http_parse_headers($header_block, TRUE));
// If we are in safe mode, we need to process redirects manually
if ($manual_redirect && (($result['code'] == 301) || ($result['code'] == 302) || ($result['code'] == 307))) {
if ($retry == 0) {
// Too many times, return an error
$result['error-code'] = 47;
$result['error'] = 'Too many redirects';
} else {
curl_close($curl);
return _http_make_request_curl($result['headers']['location'], $headers, $body, $method, $retry - 1);
}
}
}
curl_close($curl);
return $result;
}
/**
* Performs an HTTP request using sockets.
*
* @param string $url the URL
* @param array $headers HTTP headers containing name => value pairs
* @param string $body the request body
* @param string $method the HTTP request method
* @param int $retry the maximum number of redirects allowed
* @return array containing keys 'error-code' (for communication errors), 'error'
* (for communication errors), 'data' (content returned), 'code' (the HTTP status code), 'http-error'
* (if the HTTP status code is not 200 or 304), 'headers' (an array of return headers),
* 'content-type' (the HTTP content-type returned)
*/
function _http_make_request_fsock($url, $headers = array(), $body = NULL, $method = 'GET', $retry = 3) {
$result = array();
$parts = parse_url($url);
if (!isset($parts)) {
$result['error-code'] = 3;
$result['error'] = 'URL not properly formatted';
return $result;
}
if ($parts['scheme'] == 'http') {
$port = isset($parts['port']) ? $parts['port'] : 80;
$host = $parts['host'];
} elseif ($parts['scheme'] == 'https') {
$port = isset($parts['port']) ? $parts['port'] : 443;
$host = 'ssl://' . $parts['host'];
} else {
$result['error-code'] = 1;
$result['error'] = 'Unsupported protocol';
}
$fp = @fsockopen($host, $port, $errno, $errstr, 15);
if (!$fp) {
$result['error-code'] = 7;
$result['error'] = "Cannot connect: Error $errno:" . trim($errstr);
return $result;
}
if (isset($parts['path'])) {
$path = $url_parts['path'];
if (isset($parts['query'])) $path .= '?' . $url_parts['query'];
} else {
$path = '/';
}
$headers = array_merge(
array(
'Host' => $parts['host'],
'User-Agent' => SIMPLEHTTP_USER_AGENT,
'Connection' => 'close'
),
$headers
);
if (isset($parts['user']) && isset($parts['pass'])) {
$headers['Authorization'] = 'Basic '. base64_encode($parts['user'] . (!empty($parts['pass']) ? ":". $parts['pass'] : ''));
}
$request = $method . ' '. $path ." HTTP/1.0\r\n";
$keys = array_keys($headers);
for ($i = 0; $i < count($keys); $i++) {
$request .= $keys[$i] . ': ' . $headers[$keys[$i]] . "\r\n";
}
// End of headers - separator
$request .= "\r\n";
if ($body != NULL) $request .= $body;
fwrite($fp, $request);
// Fetch response.
$response = '';
while (!feof($fp) && $chunk = fread($fp, 1024)) {
$response .= $chunk;
}
fclose($fp);
// Parse response.
list($header_block, $result['data']) = explode("\r\n\r\n", $response, 2);
$result = array_merge($result, _http_parse_headers($header_block, FALSE));
// Process redirects
if (($result['code'] == 301) || ($result['code'] == 302) || ($result['code'] == 307)) {
if ($retry == 0) {
// Too many times, return an error
$result['error-code'] = 47;
$result['error'] = 'Too many redirects';
} else {
$result = _http_make_request_fsock($result['headers']['location'], $headers, $body, $method, $retry - 1);
}
}
$result['url'] = $url;
return $result;
}
/**
* Parses HTTP response headers.
*
* @param string $header_block the unparsed header block
* @param bool $curl if true, use simplified parsing as libcurl already parses
* the headers
* @return an array containing the following keys: 'protocol' (the HTTP protocol in the response),
* 'headers' (an array of return headers in lowercase). If $curl is false, additional
* parsing is done for 'code' and 'content-type'
*/
function _http_parse_headers($header_block, $curl) {
$headers = array();
$result = array();
// Split the status line from the rest of the message header
list($status, $header_block) = preg_split("/\r\n|\n|\r/", $header_block, 2);
// RFC 2616, section 4.2: Header fields can be extended over multiple lines
// by preceding each extra line with at least one space or tab. So we need
// to join them...
$header_block = preg_replace('/(\r\n|\n|\r)( |\t)+/', '', $header_block);
// Then split them to get the fields
$fields = preg_split("/\r\n|\n|\r/", $header_block);
// Parse the status line
list($protocol, $code, $reason) = explode(' ', trim($status), 3);
$result['protocol'] = $protocol;
if (!$curl) $result['code'] = $code;
// Parse headers.
while ($field = trim(array_shift($fields))) {
list($header, $value) = explode(':', $field, 2);
// Headers are case insensitive
$header = strtolower($header);
if (isset($headers[$header])) {
// RFC 2616, section 4.2: Multiple headers with the same field
// name is the same as a concatenating all the headers in a single
// header, separated by commas.
$headers[$header] .= ','. trim($value);
} else {
$headers[$header] = trim($value);
}
if (!$curl && (strtolower($header) == 'content-type')) $result['content-type'] = $value;
}
$result['headers'] = $headers;
return $result;
}
?>