2013-07-16 19:54:44 -04:00
|
|
|
<?php
|
|
|
|
|
2014-12-23 21:28:26 -05:00
|
|
|
namespace PicoFeed\Client;
|
2013-07-16 19:54:44 -04:00
|
|
|
|
2014-12-23 21:28:26 -05:00
|
|
|
use PicoFeed\Logging\Logger;
|
2013-07-16 19:54:44 -04:00
|
|
|
|
2014-03-16 21:35:57 -04:00
|
|
|
/**
|
2015-10-19 22:49:30 -04:00
|
|
|
* Stream context HTTP client.
|
2014-03-16 21:35:57 -04:00
|
|
|
*
|
|
|
|
* @author Frederic Guillot
|
|
|
|
*/
|
2014-05-20 14:20:27 -04:00
|
|
|
class Stream extends Client
|
2013-07-16 19:54:44 -04:00
|
|
|
{
|
2014-03-16 21:35:57 -04:00
|
|
|
/**
|
2015-10-19 22:49:30 -04:00
|
|
|
* Prepare HTTP headers.
|
2014-03-16 21:35:57 -04:00
|
|
|
*
|
2014-12-23 21:28:26 -05:00
|
|
|
* @return string[]
|
2014-03-16 21:35:57 -04:00
|
|
|
*/
|
2014-10-19 14:42:31 -04:00
|
|
|
private function prepareHeaders()
|
2013-07-16 19:54:44 -04:00
|
|
|
{
|
|
|
|
$headers = array(
|
|
|
|
'Connection: close',
|
|
|
|
'User-Agent: '.$this->user_agent,
|
|
|
|
);
|
|
|
|
|
2015-02-05 21:16:34 -05:00
|
|
|
// disable compression in passthrough mode. It could result in double
|
|
|
|
// compressed content which isn't decodeable by browsers
|
2015-10-19 22:49:30 -04:00
|
|
|
if (function_exists('gzdecode') && !$this->isPassthroughEnabled()) {
|
2014-05-20 14:20:27 -04:00
|
|
|
$headers[] = 'Accept-Encoding: gzip';
|
|
|
|
}
|
|
|
|
|
|
|
|
if ($this->etag) {
|
|
|
|
$headers[] = 'If-None-Match: '.$this->etag;
|
2016-12-26 17:32:18 -05:00
|
|
|
$headers[] = 'A-IM: feed';
|
2014-05-20 14:20:27 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
if ($this->last_modified) {
|
|
|
|
$headers[] = 'If-Modified-Since: '.$this->last_modified;
|
|
|
|
}
|
2013-07-16 19:54:44 -04:00
|
|
|
|
2014-10-19 14:42:31 -04:00
|
|
|
if ($this->proxy_username) {
|
|
|
|
$headers[] = 'Proxy-Authorization: Basic '.base64_encode($this->proxy_username.':'.$this->proxy_password);
|
|
|
|
}
|
|
|
|
|
2014-12-24 13:50:20 -05:00
|
|
|
if ($this->username && $this->password) {
|
|
|
|
$headers[] = 'Authorization: Basic '.base64_encode($this->username.':'.$this->password);
|
|
|
|
}
|
|
|
|
|
2015-04-10 20:34:48 -04:00
|
|
|
$headers = array_merge($headers, $this->request_headers);
|
|
|
|
|
2014-10-19 14:42:31 -04:00
|
|
|
return $headers;
|
|
|
|
}
|
|
|
|
|
2015-02-01 14:48:05 -05:00
|
|
|
/**
|
2015-10-19 22:49:30 -04:00
|
|
|
* Construct the final URL from location headers.
|
2015-02-01 14:48:05 -05:00
|
|
|
*
|
2015-10-19 22:49:30 -04:00
|
|
|
* @param array $headers List of HTTP response header
|
2015-02-01 14:48:05 -05:00
|
|
|
*/
|
|
|
|
private function setEffectiveUrl($headers)
|
|
|
|
{
|
2015-10-19 22:49:30 -04:00
|
|
|
foreach ($headers as $header) {
|
2015-02-01 14:48:05 -05:00
|
|
|
if (stripos($header, 'Location') === 0) {
|
2015-06-21 09:56:36 -04:00
|
|
|
list(, $value) = explode(': ', $header);
|
2015-02-01 14:48:05 -05:00
|
|
|
|
|
|
|
$this->url = Url::resolve($value, $this->url);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-10-19 14:42:31 -04:00
|
|
|
/**
|
2015-10-19 22:49:30 -04:00
|
|
|
* Prepare stream context.
|
2014-10-19 14:42:31 -04:00
|
|
|
*
|
|
|
|
* @return array
|
|
|
|
*/
|
|
|
|
private function prepareContext()
|
|
|
|
{
|
|
|
|
$context = array(
|
2013-07-16 19:54:44 -04:00
|
|
|
'http' => array(
|
|
|
|
'method' => 'GET',
|
|
|
|
'protocol_version' => 1.1,
|
|
|
|
'timeout' => $this->timeout,
|
2015-02-01 14:48:05 -05:00
|
|
|
'max_redirects' => $this->max_redirects,
|
2015-10-19 22:49:30 -04:00
|
|
|
),
|
2013-07-16 19:54:44 -04:00
|
|
|
);
|
|
|
|
|
2014-05-20 14:20:27 -04:00
|
|
|
if ($this->proxy_hostname) {
|
2014-12-23 21:28:26 -05:00
|
|
|
Logger::setMessage(get_called_class().' Proxy: '.$this->proxy_hostname.':'.$this->proxy_port);
|
2014-05-20 14:20:27 -04:00
|
|
|
|
2014-10-19 14:42:31 -04:00
|
|
|
$context['http']['proxy'] = 'tcp://'.$this->proxy_hostname.':'.$this->proxy_port;
|
|
|
|
$context['http']['request_fulluri'] = true;
|
2013-09-23 19:22:13 -04:00
|
|
|
|
2014-05-20 14:20:27 -04:00
|
|
|
if ($this->proxy_username) {
|
2014-12-23 21:28:26 -05:00
|
|
|
Logger::setMessage(get_called_class().' Proxy credentials: Yes');
|
2015-10-19 22:49:30 -04:00
|
|
|
} else {
|
2014-12-23 21:28:26 -05:00
|
|
|
Logger::setMessage(get_called_class().' Proxy credentials: No');
|
2014-05-20 14:20:27 -04:00
|
|
|
}
|
2013-09-23 19:22:13 -04:00
|
|
|
}
|
|
|
|
|
2014-10-19 14:42:31 -04:00
|
|
|
$context['http']['header'] = implode("\r\n", $this->prepareHeaders());
|
|
|
|
|
|
|
|
return $context;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
2015-10-19 22:49:30 -04:00
|
|
|
* Do the HTTP request.
|
2014-10-19 14:42:31 -04:00
|
|
|
*
|
2015-10-19 22:49:30 -04:00
|
|
|
* @return array HTTP response ['body' => ..., 'status' => ..., 'headers' => ...]
|
2016-12-26 17:32:18 -05:00
|
|
|
* @throws InvalidUrlException
|
|
|
|
* @throws MaxSizeException
|
|
|
|
* @throws TimeoutException
|
2014-10-19 14:42:31 -04:00
|
|
|
*/
|
2015-02-01 14:48:05 -05:00
|
|
|
public function doRequest()
|
2014-10-19 14:42:31 -04:00
|
|
|
{
|
2015-02-05 21:16:34 -05:00
|
|
|
$body = '';
|
|
|
|
|
2014-10-19 14:42:31 -04:00
|
|
|
// Create context
|
|
|
|
$context = stream_context_create($this->prepareContext());
|
2013-07-16 19:54:44 -04:00
|
|
|
|
|
|
|
// Make HTTP request
|
|
|
|
$stream = @fopen($this->url, 'r', false, $context);
|
2015-10-19 22:49:30 -04:00
|
|
|
if (!is_resource($stream)) {
|
2014-12-23 21:28:26 -05:00
|
|
|
throw new InvalidUrlException('Unable to establish a connection');
|
2014-10-19 14:42:31 -04:00
|
|
|
}
|
2013-07-16 19:54:44 -04:00
|
|
|
|
|
|
|
// Get HTTP headers response
|
|
|
|
$metadata = stream_get_meta_data($stream);
|
2015-02-05 21:16:34 -05:00
|
|
|
list($status, $headers) = HttpHeaders::parse($metadata['wrapper_data']);
|
2013-07-16 19:54:44 -04:00
|
|
|
|
2015-02-05 21:16:34 -05:00
|
|
|
if ($this->isPassthroughEnabled()) {
|
|
|
|
header(':', true, $status);
|
|
|
|
|
|
|
|
if (isset($headers['Content-Type'])) {
|
|
|
|
header('Content-Type: '.$headers['Content-Type']);
|
|
|
|
}
|
2015-02-01 14:48:05 -05:00
|
|
|
|
2015-02-05 21:16:34 -05:00
|
|
|
fpassthru($stream);
|
2015-10-19 22:49:30 -04:00
|
|
|
} else {
|
2015-02-05 21:16:34 -05:00
|
|
|
// Get the entire body until the max size
|
|
|
|
$body = stream_get_contents($stream, $this->max_body_size + 1);
|
2014-12-23 21:28:26 -05:00
|
|
|
|
2015-02-05 21:16:34 -05:00
|
|
|
// If the body size is too large abort everything
|
|
|
|
if (strlen($body) > $this->max_body_size) {
|
|
|
|
throw new MaxSizeException('Content size too large');
|
|
|
|
}
|
2013-07-16 19:54:44 -04:00
|
|
|
|
2015-02-05 21:16:34 -05:00
|
|
|
if ($metadata['timed_out']) {
|
|
|
|
throw new TimeoutException('Operation timeout');
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fclose($stream);
|
|
|
|
|
|
|
|
$this->setEffectiveUrl($metadata['wrapper_data']);
|
2015-01-27 20:13:16 -05:00
|
|
|
|
2014-10-19 14:42:31 -04:00
|
|
|
return array(
|
|
|
|
'status' => $status,
|
|
|
|
'body' => $this->decodeBody($body, $headers),
|
2015-10-19 22:49:30 -04:00
|
|
|
'headers' => $headers,
|
2014-10-19 14:42:31 -04:00
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
2015-10-19 22:49:30 -04:00
|
|
|
* Decode body response according to the HTTP headers.
|
|
|
|
*
|
|
|
|
* @param string $body Raw body
|
|
|
|
* @param HttpHeaders $headers HTTP headers
|
2014-10-19 14:42:31 -04:00
|
|
|
*
|
|
|
|
* @return string
|
|
|
|
*/
|
2014-12-23 21:28:26 -05:00
|
|
|
public function decodeBody($body, HttpHeaders $headers)
|
2014-10-19 14:42:31 -04:00
|
|
|
{
|
2013-11-12 22:31:04 -05:00
|
|
|
if (isset($headers['Transfer-Encoding']) && $headers['Transfer-Encoding'] === 'chunked') {
|
|
|
|
$body = $this->decodeChunked($body);
|
|
|
|
}
|
|
|
|
|
2014-03-16 21:35:57 -04:00
|
|
|
if (isset($headers['Content-Encoding']) && $headers['Content-Encoding'] === 'gzip') {
|
2015-10-19 22:49:30 -04:00
|
|
|
$body = gzdecode($body);
|
2014-03-16 21:35:57 -04:00
|
|
|
}
|
|
|
|
|
2014-10-19 14:42:31 -04:00
|
|
|
return $body;
|
2013-07-16 19:54:44 -04:00
|
|
|
}
|
2013-11-12 22:31:04 -05:00
|
|
|
|
2014-03-16 21:35:57 -04:00
|
|
|
/**
|
2015-10-19 22:49:30 -04:00
|
|
|
* Decode a chunked body.
|
|
|
|
*
|
|
|
|
* @param string $str Raw body
|
2014-03-16 21:35:57 -04:00
|
|
|
*
|
2015-10-19 22:49:30 -04:00
|
|
|
* @return string Decoded body
|
2014-03-16 21:35:57 -04:00
|
|
|
*/
|
2013-11-12 22:31:04 -05:00
|
|
|
public function decodeChunked($str)
|
|
|
|
{
|
2015-10-19 22:49:30 -04:00
|
|
|
for ($result = ''; !empty($str); $str = trim($str)) {
|
2013-11-12 22:31:04 -05:00
|
|
|
|
|
|
|
// Get the chunk length
|
|
|
|
$pos = strpos($str, "\r\n");
|
|
|
|
$len = hexdec(substr($str, 0, $pos));
|
|
|
|
|
|
|
|
// Append the chunk to the result
|
|
|
|
$result .= substr($str, $pos + 2, $len);
|
|
|
|
$str = substr($str, $pos + 2 + $len);
|
|
|
|
}
|
|
|
|
|
|
|
|
return $result;
|
|
|
|
}
|
2014-03-16 21:35:57 -04:00
|
|
|
}
|