diff --git a/lib/Client.php b/lib/Client.php index b79c564..7c01ac5 100644 --- a/lib/Client.php +++ b/lib/Client.php @@ -26,7 +26,7 @@ * request before it's done, such as adding authentication headers. * * The afterRequest event will be emitted after the request is completed - * succesfully. + * successfully. * * If a HTTP error is returned (status code higher than 399) the error event is * triggered. It's possible using this event to retry the request, by setting @@ -45,15 +45,22 @@ */ class Client extends EventEmitter { + const STATUS_SUCCESS = 0; + const STATUS_CURLERROR = 1; + const STATUS_HTTPERROR = 2; + /** * List of curl settings. * * @var array */ - protected $curlSettings = []; + protected $curlSettings = [ + CURLOPT_NOBODY => false, + CURLOPT_USERAGENT => 'sabre-http/'.Version::VERSION.' (http://sabre.io/)', + ]; /** - * Wether or not exceptions should be thrown when a HTTP error is returned. + * Whether or not exceptions should be thrown when a HTTP error is returned. * * @var bool */ @@ -66,30 +73,53 @@ class Client extends EventEmitter */ protected $maxRedirects = 5; + /** + * The maximum size of in-memory cache per request. If this value is exceeded, the cache is transferred to a + * temporary file. + * + * @var int + */ + protected $maxMemorySize = 2 * 1024 * 1024; + protected $headerLinesMap = []; + protected $responseResourcesMap = []; + + /** + * Cached curl handle. + * + * By keeping this resource around for the lifetime of this object, things + * like persistent connections are possible. + * + * @var resource|\CurlHandle + */ + private $curlHandle; + + /** + * Handler for curl_multi requests. + * + * The first time sendAsync is used, this will be created. + * + * @var resource|\CurlMultiHandle + */ + private $curlMultiHandle; + /** - * Initializes the client. + * Has a list of curl handles, as well as their associated success and + * error callbacks. + * + * @var array + */ + private $curlMultiMap = []; + + /** + * Reserved for backward compatibility. */ public function __construct() { - // See https://github.com/sabre-io/http/pull/115#discussion_r241292068 - // Preserve compatibility for sub-classes that implements their own method `parseCurlResult` - $separatedHeaders = __CLASS__ === get_class($this); - - $this->curlSettings = [ - CURLOPT_RETURNTRANSFER => true, - CURLOPT_NOBODY => false, - CURLOPT_USERAGENT => 'sabre-http/'.Version::VERSION.' (http://sabre.io/)', - ]; - if ($separatedHeaders) { - $this->curlSettings[CURLOPT_HEADERFUNCTION] = [$this, 'receiveCurlHeader']; - } else { - $this->curlSettings[CURLOPT_HEADER] = true; - } } - protected function receiveCurlHeader($curlHandle, $headerLine) + protected function receiveCurlHeader($curlHandle, $headerLine): int { $this->headerLinesMap[(int) $curlHandle][] = $headerLine; @@ -197,32 +227,29 @@ public function poll(): bool } do { - $r = curl_multi_exec( - $this->curlMultiHandle, - $stillRunning - ); + $r = curl_multi_exec($this->curlMultiHandle, $stillRunning); } while (CURLM_CALL_MULTI_PERFORM === $r); $messagesInQueue = 0; do { - messageQueue: + $status = curl_multi_info_read($this->curlMultiHandle, $messagesInQueue); - $status = curl_multi_info_read( - $this->curlMultiHandle, - $messagesInQueue - ); + if (false !== $status && CURLMSG_DONE === $status['msg']) { + $curlHandle = $status['handle']; + $handleId = (int) $curlHandle; + [$request, $successCallback, $errorCallback, $retryCount] = $this->curlMultiMap[$handleId]; - if ($status && CURLMSG_DONE === $status['msg']) { - $resourceId = (int) $status['handle']; - list( - $request, - $successCallback, - $errorCallback, - $retryCount) = $this->curlMultiMap[$resourceId]; - unset($this->curlMultiMap[$resourceId]); + $curlResult = $this->parseCurlResource($curlHandle); + + // Cleanup + curl_multi_remove_handle($this->curlMultiHandle, $curlHandle); + curl_close($curlHandle); + unset( + $this->curlMultiMap[$handleId], + $this->responseResourcesMap[$handleId], + $this->headerLinesMap[$handleId] + ); - $curlHandle = $status['handle']; - $curlResult = $this->parseResponse(curl_multi_getcontent($curlHandle), $curlHandle); $retry = false; if (self::STATUS_CURLERROR === $curlResult['status']) { @@ -232,7 +259,7 @@ public function poll(): bool if ($retry) { ++$retryCount; $this->sendAsyncInternal($request, $successCallback, $errorCallback, $retryCount); - goto messageQueue; + continue; } $curlResult['request'] = $request; @@ -247,7 +274,7 @@ public function poll(): bool if ($retry) { ++$retryCount; $this->sendAsyncInternal($request, $successCallback, $errorCallback, $retryCount); - goto messageQueue; + continue; } $curlResult['request'] = $request; @@ -312,17 +339,15 @@ public function addCurlSetting(int $name, $value) */ protected function doRequest(RequestInterface $request): ResponseInterface { - $settings = $this->createCurlSettingsArray($request); - if (!$this->curlHandle) { $this->curlHandle = curl_init(); } else { curl_reset($this->curlHandle); } - curl_setopt_array($this->curlHandle, $settings); - $response = $this->curlExec($this->curlHandle); - $response = $this->parseResponse($response, $this->curlHandle); + $this->prepareCurl($request, $this->curlHandle); + $this->curlExecInternal($this->curlHandle); + $response = $this->parseCurlResource($this->curlHandle); if (self::STATUS_CURLERROR === $response['status']) { throw new ClientException($response['curl_errmsg'], $response['curl_errno']); } @@ -330,33 +355,6 @@ protected function doRequest(RequestInterface $request): ResponseInterface return $response['response']; } - /** - * Cached curl handle. - * - * By keeping this resource around for the lifetime of this object, things - * like persistent connections are possible. - * - * @var resource - */ - private $curlHandle; - - /** - * Handler for curl_multi requests. - * - * The first time sendAsync is used, this will be created. - * - * @var resource - */ - private $curlMultiHandle; - - /** - * Has a list of curl handles, as well as their associated success and - * error callbacks. - * - * @var array - */ - private $curlMultiMap = []; - /** * Turns a RequestInterface object into an array with settings that can be * fed to curl_setopt. @@ -411,28 +409,61 @@ protected function createCurlSettingsArray(RequestInterface $request): array return $settings; } - const STATUS_SUCCESS = 0; - const STATUS_CURLERROR = 1; - const STATUS_HTTPERROR = 2; - - private function parseResponse(string $response, $curlHandle): array + /** + * Parses the result of a curl call in a format that's a bit more + * convenient to work with. + * + * The method returns an array with the following elements: + * * status - one of the 3 STATUS constants. + * * curl_errno - A curl error number. Only set if status is + * STATUS_CURLERROR. + * * curl_errmsg - A current error message. Only set if status is + * STATUS_CURLERROR. + * * response - Response object. Only set if status is STATUS_SUCCESS, or + * STATUS_HTTPERROR. + * * http_code - HTTP status code, as an int. Only set if Only set if + * status is STATUS_SUCCESS, or STATUS_HTTPERROR + * + * @param resource|\CurlHandle $curlHandle + */ + protected function parseCurlResource($curlHandle): array { - $settings = $this->curlSettings; - $separatedHeaders = isset($settings[CURLOPT_HEADERFUNCTION]) && (bool) $settings[CURLOPT_HEADERFUNCTION]; - - if ($separatedHeaders) { - $resourceId = (int) $curlHandle; - if (isset($this->headerLinesMap[$resourceId])) { - $headers = $this->headerLinesMap[$resourceId]; - } else { - $headers = []; - } - $response = $this->parseCurlResponse($headers, $response, $curlHandle); + [$curlInfo, $curlErrNo, $curlErrMsg] = $this->curlStuff($curlHandle); + + if ($curlErrNo) { + return [ + 'status' => self::STATUS_CURLERROR, + 'curl_errno' => $curlErrNo, + 'curl_errmsg' => $curlErrMsg, + ]; + } + $handleId = (int) $curlHandle; + + $response = new Response(); + $response->setStatus($curlInfo['http_code']); + + if (isset($this->responseResourcesMap[$handleId])) { + rewind($this->responseResourcesMap[$handleId]); + $response->setBody($this->responseResourcesMap[$handleId]); } else { - $response = $this->parseCurlResult($response, $curlHandle); + $response->setBody(''); } - return $response; + $headerLines = $this->headerLinesMap[$handleId] ?? []; + foreach ($headerLines as $header) { + $parts = explode(':', $header, 2); + if (2 === count($parts)) { + $response->addHeader(trim($parts[0]), trim($parts[1])); + } + } + + $httpCode = $response->getStatus(); + + return [ + 'status' => $httpCode >= 400 ? self::STATUS_HTTPERROR : self::STATUS_SUCCESS, + 'response' => $response, + 'http_code' => $httpCode, + ]; } /** @@ -450,15 +481,13 @@ private function parseResponse(string $response, $curlHandle): array * * http_code - HTTP status code, as an int. Only set if Only set if * status is STATUS_SUCCESS, or STATUS_HTTPERROR * - * @param resource $curlHandle + * @deprecated Use parseCurlResource instead + * + * @param resource|\CurlHandle $curlHandle */ protected function parseCurlResponse(array $headerLines, string $body, $curlHandle): array { - list( - $curlInfo, - $curlErrNo, - $curlErrMsg - ) = $this->curlStuff($curlHandle); + [$curlInfo, $curlErrNo, $curlErrMsg] = $this->curlStuff($curlHandle); if ($curlErrNo) { return [ @@ -503,17 +532,13 @@ protected function parseCurlResponse(array $headerLines, string $body, $curlHand * * http_code - HTTP status code, as an int. Only set if Only set if * status is STATUS_SUCCESS, or STATUS_HTTPERROR * - * @deprecated Use parseCurlResponse instead + * @deprecated Use parseCurlResource instead * - * @param resource $curlHandle + * @param resource|\CurlHandle $curlHandle */ protected function parseCurlResult(string $response, $curlHandle): array { - list( - $curlInfo, - $curlErrNo, - $curlErrMsg - ) = $this->curlStuff($curlHandle); + [$curlInfo, $curlErrNo, $curlErrMsg] = $this->curlStuff($curlHandle); if ($curlErrNo) { return [ @@ -557,14 +582,10 @@ protected function sendAsyncInternal(RequestInterface $request, callable $succes $this->curlMultiHandle = curl_multi_init(); } $curl = curl_init(); - curl_setopt_array( - $curl, - $this->createCurlSettingsArray($request) - ); + $this->prepareCurl($request, $curl); curl_multi_add_handle($this->curlMultiHandle, $curl); $resourceId = (int) $curl; - $this->headerLinesMap[$resourceId] = []; $this->curlMultiMap[$resourceId] = [ $request, $success, @@ -573,6 +594,40 @@ protected function sendAsyncInternal(RequestInterface $request, callable $succes ]; } + /** + * @param resource|\CurlHandle $curlHandle + */ + protected function prepareCurl(RequestInterface $request, $curlHandle): void + { + $handleId = (int) $curlHandle; + $this->headerLinesMap[$handleId] = []; + $options = $this->createCurlSettingsArray($request); + + $options[CURLOPT_RETURNTRANSFER] = false; + $options[CURLOPT_HEADER] = false; + + if (!($options[CURLOPT_NOBODY] ?? false) && !array_key_exists(CURLOPT_WRITEFUNCTION, $options)) { + $options[CURLOPT_FILE] = $this->responseResourcesMap[$handleId] = $options[CURLOPT_FILE] ?? \fopen( + "php://temp/maxmemory:{$this->maxMemorySize}", + 'rw+b' + ); + } else { + $this->responseResourcesMap[$handleId] = null; + } + + $userHeaderFunction = $this->curlSettings[CURLOPT_HEADERFUNCTION] ?? null; + $options[CURLOPT_HEADERFUNCTION] = function ($curlHandle, $str) use ($userHeaderFunction) { + // Call user func + if (is_callable($userHeaderFunction)) { + $userHeaderFunction($curlHandle, $str); + } + + return $this->receiveCurlHeader($curlHandle, $str); + }; + + curl_setopt_array($curlHandle, $options); + } + // @codeCoverageIgnoreStart /** @@ -580,18 +635,34 @@ protected function sendAsyncInternal(RequestInterface $request, callable $succes * * This method exists so it can easily be overridden and mocked. * - * @param resource $curlHandle + * @param resource|\CurlHandle $curlHandle + */ + protected function curlExecInternal($curlHandle): bool + { + return curl_exec($curlHandle); + } + + /** + * Calls curl_exec and returns content string with headers. + * + * This method exists so it can easily be overridden and mocked. + * + * @param resource|\CurlHandle $curlHandle + * + * @deprecated */ protected function curlExec($curlHandle): string { - $this->headerLinesMap[(int) $curlHandle] = []; + $result = $this->curlExecInternal($curlHandle); + + $handleId = (int) $curlHandle; - $result = curl_exec($curlHandle); - if (false === $result) { - $result = ''; + if (!$result || !isset($this->responseResourcesMap[$handleId])) { + return ''; } + rewind($this->responseResourcesMap[$handleId]); - return $result; + return stream_get_contents($this->responseResourcesMap[$handleId]); } /** @@ -599,7 +670,7 @@ protected function curlExec($curlHandle): string * * This method exists so it can easily be overridden and mocked. * - * @param resource $curlHandle + * @param resource|\CurlHandle $curlHandle */ protected function curlStuff($curlHandle): array { diff --git a/tests/HTTP/ClientTest.php b/tests/HTTP/ClientTest.php index f94b9a1..844995a 100644 --- a/tests/HTTP/ClientTest.php +++ b/tests/HTTP/ClientTest.php @@ -14,8 +14,6 @@ public function testCreateCurlSettingsArrayGET() $request = new Request('GET', 'http://example.org/', ['X-Foo' => 'bar']); $settings = [ - CURLOPT_RETURNTRANSFER => true, - CURLOPT_HEADER => true, CURLOPT_POSTREDIR => 0, CURLOPT_HTTPHEADER => ['X-Foo: bar'], CURLOPT_NOBODY => false, @@ -40,8 +38,6 @@ public function testCreateCurlSettingsArrayHEAD() $request = new Request('HEAD', 'http://example.org/', ['X-Foo' => 'bar']); $settings = [ - CURLOPT_RETURNTRANSFER => true, - CURLOPT_HEADER => true, CURLOPT_NOBODY => true, CURLOPT_CUSTOMREQUEST => 'HEAD', CURLOPT_HTTPHEADER => ['X-Foo: bar'], @@ -74,8 +70,6 @@ public function testCreateCurlSettingsArrayGETAfterHEAD() $settings = [ CURLOPT_CUSTOMREQUEST => 'GET', - CURLOPT_RETURNTRANSFER => true, - CURLOPT_HEADER => true, CURLOPT_HTTPHEADER => ['X-Foo: bar'], CURLOPT_NOBODY => false, CURLOPT_URL => 'http://example.org/', @@ -101,8 +95,6 @@ public function testCreateCurlSettingsArrayPUTStream() $request = new Request('PUT', 'http://example.org/', ['X-Foo' => 'bar'], $h); $settings = [ - CURLOPT_RETURNTRANSFER => true, - CURLOPT_HEADER => true, CURLOPT_PUT => true, CURLOPT_INFILE => $h, CURLOPT_NOBODY => false, @@ -128,8 +120,6 @@ public function testCreateCurlSettingsArrayPUTString() $request = new Request('PUT', 'http://example.org/', ['X-Foo' => 'bar'], 'boo'); $settings = [ - CURLOPT_RETURNTRANSFER => true, - CURLOPT_HEADER => true, CURLOPT_NOBODY => false, CURLOPT_POSTFIELDS => 'boo', CURLOPT_CUSTOMREQUEST => 'PUT', @@ -215,6 +205,43 @@ public function testSendToGetLargeContent() $this->assertLessThan(60 * pow(1024, 2), memory_get_peak_usage()); } + /** + * @group ci + */ + public function testSendHeadHeader() + { + $url = $this->getAbsoluteUrl('/large.php'); + if (!$url) { + $this->markTestSkipped('Set an environment value BASEURL to continue'); + } + + $request = new Request('HEAD', $url); + $client = new Client(); + $response = $client->send($request); + + $this->assertEquals(200, $response->getStatus()); + $this->assertEmpty($response->getBodyAsString()); + } + + /** + * @group ci + */ + public function testSendToGetVeryLargeContent() + { + $memoryLimit = max(64, ceil($this->getMemoryLimit() / 1024 / 1024)); + $url = $this->getAbsoluteUrl("/anysize.php?size={$memoryLimit}"); + if (!$url) { + $this->markTestSkipped('Set an environment value BASEURL to continue'); + } + + $request = new Request('GET', $url); + $client = new Client(); + $response = $client->send($request); + + $this->assertEquals(200, $response->getStatus()); + $this->assertLessThan(60 * pow(1024, 2), memory_get_peak_usage()); + } + /** * @group ci */ @@ -229,7 +256,7 @@ public function testSendAsync() $request = new Request('GET', $url); $client->sendAsync($request, function (ResponseInterface $response) { - $this->assertEquals("foo\n", $response->getBody()); + $this->assertEquals("foo\n", stream_get_contents($response->getBody())); $this->assertEquals(200, $response->getStatus()); $this->assertEquals(4, $response->getHeader('Content-Length')); }, function ($error) use ($request) { @@ -243,7 +270,7 @@ public function testSendAsync() /** * @group ci */ - public function testSendAsynConsecutively() + public function testSendAsyncConsecutively() { $url = $this->getAbsoluteUrl('/foo'); if (!$url) { @@ -254,7 +281,7 @@ public function testSendAsynConsecutively() $request = new Request('GET', $url); $client->sendAsync($request, function (ResponseInterface $response) { - $this->assertEquals("foo\n", $response->getBody()); + $this->assertEquals("foo\n", $response->getBodyAsString()); $this->assertEquals(200, $response->getStatus()); $this->assertEquals(4, $response->getHeader('Content-Length')); }, function ($error) use ($request) { @@ -265,7 +292,7 @@ public function testSendAsynConsecutively() $url = $this->getAbsoluteUrl('/bar.php'); $request = new Request('GET', $url); $client->sendAsync($request, function (ResponseInterface $response) { - $this->assertEquals("bar\n", $response->getBody()); + $this->assertEquals("bar\n", $response->getBodyAsString()); $this->assertEquals(200, $response->getStatus()); $this->assertEquals('Bar', $response->getHeader('X-Test')); }, function ($error) use ($request) { @@ -434,8 +461,10 @@ public function testDoRequest() { $client = new ClientMock(); $request = new Request('GET', 'http://example.org/'); - $client->on('curlExec', function (&$return) { - $return = "HTTP/1.1 200 OK\r\nHeader1:Val1\r\n\r\nFoo"; + $client->on('curlExecInternal', function (&$return, string &$headers, string &$body) { + $return = true; + $body = 'Foo'; + $headers = "HTTP/1.1 200 OK\r\nHeader1:Val1\r\n\r\n"; }); $client->on('curlStuff', function (&$return) { $return = [ @@ -457,8 +486,8 @@ public function testDoRequestCurlError() { $client = new ClientMock(); $request = new Request('GET', 'http://example.org/'); - $client->on('curlExec', function (&$return) { - $return = ''; + $client->on('curlExecInternal', function (&$return, string &$headers, string &$body) { + $return = false; }); $client->on('curlStuff', function (&$return) { $return = [ @@ -476,6 +505,28 @@ public function testDoRequestCurlError() $this->assertEquals('Curl error', $e->getMessage()); } } + + private function getMemoryLimit(): int + { + $val = trim(ini_get('memory_limit')); + $last = strtolower($val[strlen($val) - 1]); + $val = substr($val, 0, -1); + if (!is_numeric($val) || is_numeric($last)) { + return PHP_INT_MAX; + } + switch ($last) { + case 'g': + $val *= 1024; + // no break + case 'm': + $val *= 1024; + // no break + case 'k': + $val *= 1024; + } + + return $val; + } } class ClientMock extends Client @@ -485,7 +536,7 @@ class ClientMock extends Client /** * Making this method public. */ - public function receiveCurlHeader($curlHandle, $headerLine) + public function receiveCurlHeader($curlHandle, $headerLine): int { return parent::receiveCurlHeader($curlHandle, $headerLine); } @@ -543,22 +594,36 @@ protected function curlStuff($curlHandle): array } /** - * Calls curl_exec. - * - * This method exists so it can easily be overridden and mocked. - * * @param resource $curlHandle */ - protected function curlExec($curlHandle): string + protected function curlExecInternal($curlHandle): bool { $return = null; - $this->emit('curlExec', [&$return]); + $headers = ''; + $body = ''; + $this->emit('curlExecInternal', [&$return, &$headers, &$body]); // If nothing modified $return, we're using the default behavior. if (is_null($return)) { - return parent::curlExec($curlHandle); + return parent::curlExecInternal($curlHandle); } else { + $this->parseHeadersBlock($curlHandle, $headers); + $stream = \fopen('php://memory', 'rw+'); + if (strlen($body) > 0) { + fwrite($stream, $body); + rewind($stream); + } + $this->responseResourcesMap[(int) $curlHandle] = $stream; + return $return; } } + + protected function parseHeadersBlock($curlHandle, string $str): void + { + $headerBlob = explode("\r\n", trim($str, "\r\n")); + foreach ($headerBlob as $headerLine) { + $this->receiveCurlHeader($curlHandle, $headerLine); + } + } } diff --git a/tests/www/anysize.php b/tests/www/anysize.php new file mode 100644 index 0000000..4a16508 --- /dev/null +++ b/tests/www/anysize.php @@ -0,0 +1,19 @@ + $chunk; + } +}; + +foreach ($generator(512 * 1024, $megabytes * 2) as $value) { + echo $value; +}