diff options
Diffstat (limited to 'lib/simplepie/simplepie/src/File.php')
| -rw-r--r-- | lib/simplepie/simplepie/src/File.php | 75 |
1 files changed, 53 insertions, 22 deletions
diff --git a/lib/simplepie/simplepie/src/File.php b/lib/simplepie/simplepie/src/File.php index 93c943624..4a8cb157c 100644 --- a/lib/simplepie/simplepie/src/File.php +++ b/lib/simplepie/simplepie/src/File.php @@ -57,7 +57,7 @@ class File implements Response */ public $status_code = 0; - /** @var int Number of redirect that were already performed during this request sequence. */ + /** @var non-negative-int Number of redirect that were already performed during this request sequence. */ public $redirects = 0; /** @var ?string */ @@ -91,7 +91,7 @@ class File implements Response if (function_exists('idn_to_ascii')) { $parsed = \SimplePie\Misc::parse_url($url); if ($parsed['authority'] !== '' && !ctype_print($parsed['authority'])) { - $authority = \idn_to_ascii($parsed['authority'], \IDNA_NONTRANSITIONAL_TO_ASCII, \INTL_IDNA_VARIANT_UTS46); + $authority = (string) \idn_to_ascii($parsed['authority'], \IDNA_NONTRANSITIONAL_TO_ASCII, \INTL_IDNA_VARIANT_UTS46); $url = \SimplePie\Misc::compress_parse_url($parsed['scheme'], $authority, $parsed['path'], $parsed['query'], null); } } @@ -102,7 +102,7 @@ class File implements Response $this->useragent = $useragent; if (preg_match('/^http(s)?:\/\//i', $url)) { if ($useragent === null) { - $useragent = ini_get('user_agent'); + $useragent = (string) ini_get('user_agent'); $this->useragent = $useragent; } if (!is_array($headers)) { @@ -127,7 +127,7 @@ class File implements Response curl_setopt($fp, CURLOPT_URL, $url); curl_setopt($fp, CURLOPT_HEADER, 1); curl_setopt($fp, CURLOPT_RETURNTRANSFER, 1); - // curl_setopt($fp, CURLOPT_FAILONERROR, 1); // FreshRSS removed to retrieve headers even on HTTP errors + curl_setopt($fp, CURLOPT_FAILONERROR, 1); curl_setopt($fp, CURLOPT_TIMEOUT, $timeout); curl_setopt($fp, CURLOPT_CONNECTTIMEOUT, $timeout); // curl_setopt($fp, CURLOPT_REFERER, \SimplePie\Misc::url_remove_credentials($url)); // FreshRSS removed @@ -138,10 +138,9 @@ class File implements Response } $responseHeaders = curl_exec($fp); - if (curl_errno($fp) === 23 || curl_errno($fp) === 61) { + if (curl_errno($fp) === CURLE_WRITE_ERROR || curl_errno($fp) === CURLE_BAD_CONTENT_ENCODING) { $this->error = 'cURL error ' . curl_errno($fp) . ': ' . curl_error($fp); // FreshRSS - $this->status_code = curl_getinfo($fp, CURLINFO_HTTP_CODE); // FreshRSS - $this->on_http_response($responseHeaders); + $this->on_http_response(); $this->error = null; // FreshRSS curl_setopt($fp, CURLOPT_ENCODING, 'none'); $responseHeaders = curl_exec($fp); @@ -150,15 +149,17 @@ class File implements Response if (curl_errno($fp)) { $this->error = 'cURL error ' . curl_errno($fp) . ': ' . curl_error($fp); $this->success = false; - $this->on_http_response($responseHeaders); + $this->on_http_response(); } else { - $this->on_http_response($responseHeaders); + $this->on_http_response(); // Use the updated url provided by curl_getinfo after any redirects. if ($info = curl_getinfo($fp)) { $this->url = $info['url']; } + // For PHPStan: We already checked that error did not occur. + assert(is_array($info) && $info['redirect_count'] >= 0); curl_close($fp); - $responseHeaders = \SimplePie\HTTP\Parser::prepareHeaders($responseHeaders, $info['redirect_count'] + 1); + $responseHeaders = \SimplePie\HTTP\Parser::prepareHeaders((string) $responseHeaders, $info['redirect_count'] + 1); $parser = new \SimplePie\HTTP\Parser($responseHeaders, true); if ($parser->parse()) { $this->set_headers($parser->headers); @@ -167,6 +168,11 @@ class File implements Response if ((in_array($this->status_code, [300, 301, 302, 303, 307]) || $this->status_code > 307 && $this->status_code < 400) && ($locationHeader = $this->get_header_line('location')) !== '' && $this->redirects < $redirects) { $this->redirects++; $location = \SimplePie\Misc::absolutize_url($locationHeader, $url); + if ($location === false) { + $this->error = "Invalid redirect location, trying to base “{$locationHeader}” onto “{$url}”"; + $this->success = false; + return; + } $this->permanentUrlMutable = $this->permanentUrlMutable && ($this->status_code == 301 || $this->status_code == 308); $this->__construct($location, $timeout, $redirects, $headers, $useragent, $force_fsockopen, $curl_options); return; @@ -175,10 +181,15 @@ class File implements Response } } else { $this->method = \SimplePie\SimplePie::FILE_SOURCE_REMOTE | \SimplePie\SimplePie::FILE_SOURCE_FSOCKOPEN; - $url_parts = parse_url($url); + if (($url_parts = parse_url($url)) === false) { + throw new \InvalidArgumentException('Malformed URL: ' . $url); + } + if (!isset($url_parts['host'])) { + throw new \InvalidArgumentException('Missing hostname: ' . $url); + } $socket_host = $url_parts['host']; if (isset($url_parts['scheme']) && strtolower($url_parts['scheme']) === 'https') { - $socket_host = "ssl://$url_parts[host]"; + $socket_host = 'ssl://' . $socket_host; $url_parts['port'] = 443; } if (!isset($url_parts['port'])) { @@ -188,7 +199,7 @@ class File implements Response if (!$fp) { $this->error = 'fsockopen error: ' . $errstr; $this->success = false; - $this->on_http_response(false); + $this->on_http_response(); } else { stream_set_timeout($fp, $timeout); if (isset($url_parts['path'])) { @@ -229,15 +240,21 @@ class File implements Response $this->set_headers($parser->headers); $this->body = $parser->body; $this->status_code = $parser->status_code; - $this->on_http_response($responseHeaders); + $this->on_http_response(); if ((in_array($this->status_code, [300, 301, 302, 303, 307]) || $this->status_code > 307 && $this->status_code < 400) && ($locationHeader = $this->get_header_line('location')) !== '' && $this->redirects < $redirects) { $this->redirects++; $location = \SimplePie\Misc::absolutize_url($locationHeader, $url); $this->permanentUrlMutable = $this->permanentUrlMutable && ($this->status_code == 301 || $this->status_code == 308); + if ($location === false) { + $this->error = "Invalid redirect location, trying to base “{$locationHeader}” onto “{$url}”"; + $this->success = false; + return; + } $this->__construct($location, $timeout, $redirects, $headers, $useragent, $force_fsockopen, $curl_options); return; } if (($contentEncodingHeader = $this->get_header_line('content-encoding')) !== '') { + assert($this->body !== null); // For PHPStan // FreshRSS // Hey, we act dumb elsewhere, so let's do that here too switch (strtolower(trim($contentEncodingHeader, "\x09\x0A\x0D\x20"))) { case 'gzip': @@ -271,12 +288,12 @@ class File implements Response } else { $this->error = 'Could not parse'; // FreshRSS $this->success = false; // FreshRSS - $this->on_http_response($responseHeaders); + $this->on_http_response(); } } else { $this->error = 'fsocket timed out'; $this->success = false; - $this->on_http_response($responseHeaders); + $this->on_http_response(); } fclose($fp); } @@ -291,22 +308,23 @@ class File implements Response $this->body = $filebody; $this->status_code = 200; } - $this->on_http_response($filebody); + $this->on_http_response(); } if ($this->success) { - // (Leading) whitespace may cause XML parsing errors so we trim it, - // but we must not trim \x00 to avoid breaking BOM or multibyte characters - $this->body = trim($this->body, " \n\r\t\v"); + assert($this->body !== null); // For PHPStan + // Leading whitespace may cause XML parsing errors (XML declaration cannot be preceded by anything other than BOM) so we trim it. + // Note that unlike built-in `trim` function’s default settings, we do not trim `\x00` to avoid breaking characters in UTF-16 or UTF-32 encoded strings. + // We also only do that when the whitespace is followed by `<`, so that we do not break e.g. UTF-16LE encoded whitespace like `\n\x00` in half. + $this->body = preg_replace('/^[ \n\r\t\v]+</', '<', $this->body); } } /** * Event to allow inheriting classes to e.g. log the HTTP responses. * Triggered just after an HTTP response is received. - * @param string|false $response The raw HTTP response headers and body, or false in case of failure (as returned by curl_exec()). * FreshRSS. */ - protected function on_http_response(string|false $response): void + protected function on_http_response(): void { } @@ -343,6 +361,19 @@ class File implements Response return $this->parsed_headers[strtolower($name)] ?? []; } + public function with_header(string $name, $value) + { + $this->maybe_update_headers(); + $new = clone $this; + + $newHeader = [ + strtolower($name) => (array) $value, + ]; + $new->set_headers($newHeader + $this->get_headers()); + + return $new; + } + public function get_header_line(string $name): string { $this->maybe_update_headers(); |
