[ Index ] |
PHP Cross Reference of WordPress Trunk (Updated Daily) |
[Summary view] [Print] [Text view]
1 <?php 2 3 /** 4 * SimplePie 5 * 6 * A PHP-Based RSS and Atom Feed Framework. 7 * Takes the hard work out of managing a complete RSS/Atom solution. 8 * 9 * Copyright (c) 2004-2022, Ryan Parman, Sam Sneddon, Ryan McCue, and contributors 10 * All rights reserved. 11 * 12 * Redistribution and use in source and binary forms, with or without modification, are 13 * permitted provided that the following conditions are met: 14 * 15 * * Redistributions of source code must retain the above copyright notice, this list of 16 * conditions and the following disclaimer. 17 * 18 * * Redistributions in binary form must reproduce the above copyright notice, this list 19 * of conditions and the following disclaimer in the documentation and/or other materials 20 * provided with the distribution. 21 * 22 * * Neither the name of the SimplePie Team nor the names of its contributors may be used 23 * to endorse or promote products derived from this software without specific prior 24 * written permission. 25 * 26 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS 27 * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY 28 * AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS 29 * AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 30 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR 31 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 32 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR 33 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 34 * POSSIBILITY OF SUCH DAMAGE. 35 * 36 * @package SimplePie 37 * @copyright 2004-2016 Ryan Parman, Sam Sneddon, Ryan McCue 38 * @author Ryan Parman 39 * @author Sam Sneddon 40 * @author Ryan McCue 41 * @link http://simplepie.org/ SimplePie 42 * @license http://www.opensource.org/licenses/bsd-license.php BSD License 43 */ 44 45 namespace SimplePie\HTTP; 46 47 /** 48 * HTTP Response Parser 49 * 50 * @package SimplePie 51 * @subpackage HTTP 52 */ 53 class Parser 54 { 55 /** 56 * HTTP Version 57 * 58 * @var float 59 */ 60 public $http_version = 0.0; 61 62 /** 63 * Status code 64 * 65 * @var int 66 */ 67 public $status_code = 0; 68 69 /** 70 * Reason phrase 71 * 72 * @var string 73 */ 74 public $reason = ''; 75 76 /** 77 * Key/value pairs of the headers 78 * 79 * @var array 80 */ 81 public $headers = []; 82 83 /** 84 * Body of the response 85 * 86 * @var string 87 */ 88 public $body = ''; 89 90 private const STATE_HTTP_VERSION = 'http_version'; 91 92 private const STATE_STATUS = 'status'; 93 94 private const STATE_REASON = 'reason'; 95 96 private const STATE_NEW_LINE = 'new_line'; 97 98 private const STATE_BODY = 'body'; 99 100 private const STATE_NAME = 'name'; 101 102 private const STATE_VALUE = 'value'; 103 104 private const STATE_VALUE_CHAR = 'value_char'; 105 106 private const STATE_QUOTE = 'quote'; 107 108 private const STATE_QUOTE_ESCAPED = 'quote_escaped'; 109 110 private const STATE_QUOTE_CHAR = 'quote_char'; 111 112 private const STATE_CHUNKED = 'chunked'; 113 114 private const STATE_EMIT = 'emit'; 115 116 private const STATE_ERROR = false; 117 118 /** 119 * Current state of the state machine 120 * 121 * @var self::STATE_* 122 */ 123 protected $state = self::STATE_HTTP_VERSION; 124 125 /** 126 * Input data 127 * 128 * @var string 129 */ 130 protected $data = ''; 131 132 /** 133 * Input data length (to avoid calling strlen() everytime this is needed) 134 * 135 * @var int 136 */ 137 protected $data_length = 0; 138 139 /** 140 * Current position of the pointer 141 * 142 * @var int 143 */ 144 protected $position = 0; 145 146 /** 147 * Name of the hedaer currently being parsed 148 * 149 * @var string 150 */ 151 protected $name = ''; 152 153 /** 154 * Value of the hedaer currently being parsed 155 * 156 * @var string 157 */ 158 protected $value = ''; 159 160 /** 161 * Create an instance of the class with the input data 162 * 163 * @param string $data Input data 164 */ 165 public function __construct($data) 166 { 167 $this->data = $data; 168 $this->data_length = strlen($this->data); 169 } 170 171 /** 172 * Parse the input data 173 * 174 * @return bool true on success, false on failure 175 */ 176 public function parse() 177 { 178 while ($this->state && $this->state !== self::STATE_EMIT && $this->has_data()) { 179 $state = $this->state; 180 $this->$state(); 181 } 182 $this->data = ''; 183 if ($this->state === self::STATE_EMIT || $this->state === self::STATE_BODY) { 184 return true; 185 } 186 187 $this->http_version = ''; 188 $this->status_code = 0; 189 $this->reason = ''; 190 $this->headers = []; 191 $this->body = ''; 192 return false; 193 } 194 195 /** 196 * Check whether there is data beyond the pointer 197 * 198 * @return bool true if there is further data, false if not 199 */ 200 protected function has_data() 201 { 202 return (bool) ($this->position < $this->data_length); 203 } 204 205 /** 206 * See if the next character is LWS 207 * 208 * @return bool true if the next character is LWS, false if not 209 */ 210 protected function is_linear_whitespace() 211 { 212 return (bool) ($this->data[$this->position] === "\x09" 213 || $this->data[$this->position] === "\x20" 214 || ($this->data[$this->position] === "\x0A" 215 && isset($this->data[$this->position + 1]) 216 && ($this->data[$this->position + 1] === "\x09" || $this->data[$this->position + 1] === "\x20"))); 217 } 218 219 /** 220 * Parse the HTTP version 221 */ 222 protected function http_version() 223 { 224 if (strpos($this->data, "\x0A") !== false && strtoupper(substr($this->data, 0, 5)) === 'HTTP/') { 225 $len = strspn($this->data, '0123456789.', 5); 226 $this->http_version = substr($this->data, 5, $len); 227 $this->position += 5 + $len; 228 if (substr_count($this->http_version, '.') <= 1) { 229 $this->http_version = (float) $this->http_version; 230 $this->position += strspn($this->data, "\x09\x20", $this->position); 231 $this->state = self::STATE_STATUS; 232 } else { 233 $this->state = self::STATE_ERROR; 234 } 235 } else { 236 $this->state = self::STATE_ERROR; 237 } 238 } 239 240 /** 241 * Parse the status code 242 */ 243 protected function status() 244 { 245 if ($len = strspn($this->data, '0123456789', $this->position)) { 246 $this->status_code = (int) substr($this->data, $this->position, $len); 247 $this->position += $len; 248 $this->state = self::STATE_REASON; 249 } else { 250 $this->state = self::STATE_ERROR; 251 } 252 } 253 254 /** 255 * Parse the reason phrase 256 */ 257 protected function reason() 258 { 259 $len = strcspn($this->data, "\x0A", $this->position); 260 $this->reason = trim(substr($this->data, $this->position, $len), "\x09\x0D\x20"); 261 $this->position += $len + 1; 262 $this->state = self::STATE_NEW_LINE; 263 } 264 265 /** 266 * Deal with a new line, shifting data around as needed 267 */ 268 protected function new_line() 269 { 270 $this->value = trim($this->value, "\x0D\x20"); 271 if ($this->name !== '' && $this->value !== '') { 272 $this->name = strtolower($this->name); 273 // We should only use the last Content-Type header. c.f. issue #1 274 if (isset($this->headers[$this->name]) && $this->name !== 'content-type') { 275 $this->headers[$this->name] .= ', ' . $this->value; 276 } else { 277 $this->headers[$this->name] = $this->value; 278 } 279 } 280 $this->name = ''; 281 $this->value = ''; 282 if (substr($this->data[$this->position], 0, 2) === "\x0D\x0A") { 283 $this->position += 2; 284 $this->state = self::STATE_BODY; 285 } elseif ($this->data[$this->position] === "\x0A") { 286 $this->position++; 287 $this->state = self::STATE_BODY; 288 } else { 289 $this->state = self::STATE_NAME; 290 } 291 } 292 293 /** 294 * Parse a header name 295 */ 296 protected function name() 297 { 298 $len = strcspn($this->data, "\x0A:", $this->position); 299 if (isset($this->data[$this->position + $len])) { 300 if ($this->data[$this->position + $len] === "\x0A") { 301 $this->position += $len; 302 $this->state = self::STATE_NEW_LINE; 303 } else { 304 $this->name = substr($this->data, $this->position, $len); 305 $this->position += $len + 1; 306 $this->state = self::STATE_VALUE; 307 } 308 } else { 309 $this->state = self::STATE_ERROR; 310 } 311 } 312 313 /** 314 * Parse LWS, replacing consecutive LWS characters with a single space 315 */ 316 protected function linear_whitespace() 317 { 318 do { 319 if (substr($this->data, $this->position, 2) === "\x0D\x0A") { 320 $this->position += 2; 321 } elseif ($this->data[$this->position] === "\x0A") { 322 $this->position++; 323 } 324 $this->position += strspn($this->data, "\x09\x20", $this->position); 325 } while ($this->has_data() && $this->is_linear_whitespace()); 326 $this->value .= "\x20"; 327 } 328 329 /** 330 * See what state to move to while within non-quoted header values 331 */ 332 protected function value() 333 { 334 if ($this->is_linear_whitespace()) { 335 $this->linear_whitespace(); 336 } else { 337 switch ($this->data[$this->position]) { 338 case '"': 339 // Workaround for ETags: we have to include the quotes as 340 // part of the tag. 341 if (strtolower($this->name) === 'etag') { 342 $this->value .= '"'; 343 $this->position++; 344 $this->state = self::STATE_VALUE_CHAR; 345 break; 346 } 347 $this->position++; 348 $this->state = self::STATE_QUOTE; 349 break; 350 351 case "\x0A": 352 $this->position++; 353 $this->state = self::STATE_NEW_LINE; 354 break; 355 356 default: 357 $this->state = self::STATE_VALUE_CHAR; 358 break; 359 } 360 } 361 } 362 363 /** 364 * Parse a header value while outside quotes 365 */ 366 protected function value_char() 367 { 368 $len = strcspn($this->data, "\x09\x20\x0A\"", $this->position); 369 $this->value .= substr($this->data, $this->position, $len); 370 $this->position += $len; 371 $this->state = self::STATE_VALUE; 372 } 373 374 /** 375 * See what state to move to while within quoted header values 376 */ 377 protected function quote() 378 { 379 if ($this->is_linear_whitespace()) { 380 $this->linear_whitespace(); 381 } else { 382 switch ($this->data[$this->position]) { 383 case '"': 384 $this->position++; 385 $this->state = self::STATE_VALUE; 386 break; 387 388 case "\x0A": 389 $this->position++; 390 $this->state = self::STATE_NEW_LINE; 391 break; 392 393 case '\\': 394 $this->position++; 395 $this->state = self::STATE_QUOTE_ESCAPED; 396 break; 397 398 default: 399 $this->state = self::STATE_QUOTE_CHAR; 400 break; 401 } 402 } 403 } 404 405 /** 406 * Parse a header value while within quotes 407 */ 408 protected function quote_char() 409 { 410 $len = strcspn($this->data, "\x09\x20\x0A\"\\", $this->position); 411 $this->value .= substr($this->data, $this->position, $len); 412 $this->position += $len; 413 $this->state = self::STATE_VALUE; 414 } 415 416 /** 417 * Parse an escaped character within quotes 418 */ 419 protected function quote_escaped() 420 { 421 $this->value .= $this->data[$this->position]; 422 $this->position++; 423 $this->state = self::STATE_QUOTE; 424 } 425 426 /** 427 * Parse the body 428 */ 429 protected function body() 430 { 431 $this->body = substr($this->data, $this->position); 432 if (!empty($this->headers['transfer-encoding'])) { 433 unset($this->headers['transfer-encoding']); 434 $this->state = self::STATE_CHUNKED; 435 } else { 436 $this->state = self::STATE_EMIT; 437 } 438 } 439 440 /** 441 * Parsed a "Transfer-Encoding: chunked" body 442 */ 443 protected function chunked() 444 { 445 if (!preg_match('/^([0-9a-f]+)[^\r\n]*\r\n/i', trim($this->body))) { 446 $this->state = self::STATE_EMIT; 447 return; 448 } 449 450 $decoded = ''; 451 $encoded = $this->body; 452 453 while (true) { 454 $is_chunked = (bool) preg_match('/^([0-9a-f]+)[^\r\n]*\r\n/i', $encoded, $matches); 455 if (!$is_chunked) { 456 // Looks like it's not chunked after all 457 $this->state = self::STATE_EMIT; 458 return; 459 } 460 461 $length = hexdec(trim($matches[1])); 462 if ($length === 0) { 463 // Ignore trailer headers 464 $this->state = self::STATE_EMIT; 465 $this->body = $decoded; 466 return; 467 } 468 469 $chunk_length = strlen($matches[0]); 470 $decoded .= substr($encoded, $chunk_length, $length); 471 $encoded = substr($encoded, $chunk_length + $length + 2); 472 473 // BC for PHP < 8.0: substr() can return bool instead of string 474 $encoded = ($encoded === false) ? '' : $encoded; 475 476 if (trim($encoded) === '0' || empty($encoded)) { 477 $this->state = self::STATE_EMIT; 478 $this->body = $decoded; 479 return; 480 } 481 } 482 } 483 484 /** 485 * Prepare headers (take care of proxies headers) 486 * 487 * @param string $headers Raw headers 488 * @param integer $count Redirection count. Default to 1. 489 * 490 * @return string 491 */ 492 public static function prepareHeaders($headers, $count = 1) 493 { 494 $data = explode("\r\n\r\n", $headers, $count); 495 $data = array_pop($data); 496 if (false !== stripos($data, "HTTP/1.0 200 Connection established\r\n")) { 497 $exploded = explode("\r\n\r\n", $data, 2); 498 $data = end($exploded); 499 } 500 if (false !== stripos($data, "HTTP/1.1 200 Connection established\r\n")) { 501 $exploded = explode("\r\n\r\n", $data, 2); 502 $data = end($exploded); 503 } 504 return $data; 505 } 506 } 507 508 class_alias('SimplePie\HTTP\Parser', 'SimplePie_HTTP_Parser');
title
Description
Body
title
Description
Body
title
Description
Body
title
Body
Generated : Tue Jan 21 08:20:01 2025 | Cross-referenced by PHPXref |