[ Index ]

PHP Cross Reference of WordPress Trunk (Updated Daily)

Search

title

Body

[close]

/wp-includes/SimplePie/src/HTTP/ -> Parser.php (source)

   1  <?php
   2  
   3  /**
   4   * SimplePie
   5   *
   6   * A PHP-Based RSS and Atom Feed Framework.
   7   * Takes the hard work out of managing a complete RSS/Atom solution.
   8   *
   9   * Copyright (c) 2004-2022, Ryan Parman, Sam Sneddon, Ryan McCue, and contributors
  10   * All rights reserved.
  11   *
  12   * Redistribution and use in source and binary forms, with or without modification, are
  13   * permitted provided that the following conditions are met:
  14   *
  15   *     * Redistributions of source code must retain the above copyright notice, this list of
  16   *       conditions and the following disclaimer.
  17   *
  18   *     * Redistributions in binary form must reproduce the above copyright notice, this list
  19   *       of conditions and the following disclaimer in the documentation and/or other materials
  20   *       provided with the distribution.
  21   *
  22   *     * Neither the name of the SimplePie Team nor the names of its contributors may be used
  23   *       to endorse or promote products derived from this software without specific prior
  24   *       written permission.
  25   *
  26   * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS
  27   * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY
  28   * AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS
  29   * AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  30   * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
  31   * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  32   * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
  33   * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  34   * POSSIBILITY OF SUCH DAMAGE.
  35   *
  36   * @package SimplePie
  37   * @copyright 2004-2016 Ryan Parman, Sam Sneddon, Ryan McCue
  38   * @author Ryan Parman
  39   * @author Sam Sneddon
  40   * @author Ryan McCue
  41   * @link http://simplepie.org/ SimplePie
  42   * @license http://www.opensource.org/licenses/bsd-license.php BSD License
  43   */
  44  
  45  namespace SimplePie\HTTP;
  46  
  47  /**
  48   * HTTP Response Parser
  49   *
  50   * @package SimplePie
  51   * @subpackage HTTP
  52   */
  53  class Parser
  54  {
  55      /**
  56       * HTTP Version
  57       *
  58       * @var float
  59       */
  60      public $http_version = 0.0;
  61  
  62      /**
  63       * Status code
  64       *
  65       * @var int
  66       */
  67      public $status_code = 0;
  68  
  69      /**
  70       * Reason phrase
  71       *
  72       * @var string
  73       */
  74      public $reason = '';
  75  
  76      /**
  77       * Key/value pairs of the headers
  78       *
  79       * @var array
  80       */
  81      public $headers = [];
  82  
  83      /**
  84       * Body of the response
  85       *
  86       * @var string
  87       */
  88      public $body = '';
  89  
  90      private const STATE_HTTP_VERSION = 'http_version';
  91  
  92      private const STATE_STATUS = 'status';
  93  
  94      private const STATE_REASON = 'reason';
  95  
  96      private const STATE_NEW_LINE = 'new_line';
  97  
  98      private const STATE_BODY = 'body';
  99  
 100      private const STATE_NAME = 'name';
 101  
 102      private const STATE_VALUE = 'value';
 103  
 104      private const STATE_VALUE_CHAR = 'value_char';
 105  
 106      private const STATE_QUOTE = 'quote';
 107  
 108      private const STATE_QUOTE_ESCAPED = 'quote_escaped';
 109  
 110      private const STATE_QUOTE_CHAR = 'quote_char';
 111  
 112      private const STATE_CHUNKED = 'chunked';
 113  
 114      private const STATE_EMIT = 'emit';
 115  
 116      private const STATE_ERROR = false;
 117  
 118      /**
 119       * Current state of the state machine
 120       *
 121       * @var self::STATE_*
 122       */
 123      protected $state = self::STATE_HTTP_VERSION;
 124  
 125      /**
 126       * Input data
 127       *
 128       * @var string
 129       */
 130      protected $data = '';
 131  
 132      /**
 133       * Input data length (to avoid calling strlen() everytime this is needed)
 134       *
 135       * @var int
 136       */
 137      protected $data_length = 0;
 138  
 139      /**
 140       * Current position of the pointer
 141       *
 142       * @var int
 143       */
 144      protected $position = 0;
 145  
 146      /**
 147       * Name of the hedaer currently being parsed
 148       *
 149       * @var string
 150       */
 151      protected $name = '';
 152  
 153      /**
 154       * Value of the hedaer currently being parsed
 155       *
 156       * @var string
 157       */
 158      protected $value = '';
 159  
 160      /**
 161       * Create an instance of the class with the input data
 162       *
 163       * @param string $data Input data
 164       */
 165      public function __construct($data)
 166      {
 167          $this->data = $data;
 168          $this->data_length = strlen($this->data);
 169      }
 170  
 171      /**
 172       * Parse the input data
 173       *
 174       * @return bool true on success, false on failure
 175       */
 176      public function parse()
 177      {
 178          while ($this->state && $this->state !== self::STATE_EMIT && $this->has_data()) {
 179              $state = $this->state;
 180              $this->$state();
 181          }
 182          $this->data = '';
 183          if ($this->state === self::STATE_EMIT || $this->state === self::STATE_BODY) {
 184              return true;
 185          }
 186  
 187          $this->http_version = '';
 188          $this->status_code = 0;
 189          $this->reason = '';
 190          $this->headers = [];
 191          $this->body = '';
 192          return false;
 193      }
 194  
 195      /**
 196       * Check whether there is data beyond the pointer
 197       *
 198       * @return bool true if there is further data, false if not
 199       */
 200      protected function has_data()
 201      {
 202          return (bool) ($this->position < $this->data_length);
 203      }
 204  
 205      /**
 206       * See if the next character is LWS
 207       *
 208       * @return bool true if the next character is LWS, false if not
 209       */
 210      protected function is_linear_whitespace()
 211      {
 212          return (bool) ($this->data[$this->position] === "\x09"
 213              || $this->data[$this->position] === "\x20"
 214              || ($this->data[$this->position] === "\x0A"
 215                  && isset($this->data[$this->position + 1])
 216                  && ($this->data[$this->position + 1] === "\x09" || $this->data[$this->position + 1] === "\x20")));
 217      }
 218  
 219      /**
 220       * Parse the HTTP version
 221       */
 222      protected function http_version()
 223      {
 224          if (strpos($this->data, "\x0A") !== false && strtoupper(substr($this->data, 0, 5)) === 'HTTP/') {
 225              $len = strspn($this->data, '0123456789.', 5);
 226              $this->http_version = substr($this->data, 5, $len);
 227              $this->position += 5 + $len;
 228              if (substr_count($this->http_version, '.') <= 1) {
 229                  $this->http_version = (float) $this->http_version;
 230                  $this->position += strspn($this->data, "\x09\x20", $this->position);
 231                  $this->state = self::STATE_STATUS;
 232              } else {
 233                  $this->state = self::STATE_ERROR;
 234              }
 235          } else {
 236              $this->state = self::STATE_ERROR;
 237          }
 238      }
 239  
 240      /**
 241       * Parse the status code
 242       */
 243      protected function status()
 244      {
 245          if ($len = strspn($this->data, '0123456789', $this->position)) {
 246              $this->status_code = (int) substr($this->data, $this->position, $len);
 247              $this->position += $len;
 248              $this->state = self::STATE_REASON;
 249          } else {
 250              $this->state = self::STATE_ERROR;
 251          }
 252      }
 253  
 254      /**
 255       * Parse the reason phrase
 256       */
 257      protected function reason()
 258      {
 259          $len = strcspn($this->data, "\x0A", $this->position);
 260          $this->reason = trim(substr($this->data, $this->position, $len), "\x09\x0D\x20");
 261          $this->position += $len + 1;
 262          $this->state = self::STATE_NEW_LINE;
 263      }
 264  
 265      /**
 266       * Deal with a new line, shifting data around as needed
 267       */
 268      protected function new_line()
 269      {
 270          $this->value = trim($this->value, "\x0D\x20");
 271          if ($this->name !== '' && $this->value !== '') {
 272              $this->name = strtolower($this->name);
 273              // We should only use the last Content-Type header. c.f. issue #1
 274              if (isset($this->headers[$this->name]) && $this->name !== 'content-type') {
 275                  $this->headers[$this->name] .= ', ' . $this->value;
 276              } else {
 277                  $this->headers[$this->name] = $this->value;
 278              }
 279          }
 280          $this->name = '';
 281          $this->value = '';
 282          if (substr($this->data[$this->position], 0, 2) === "\x0D\x0A") {
 283              $this->position += 2;
 284              $this->state = self::STATE_BODY;
 285          } elseif ($this->data[$this->position] === "\x0A") {
 286              $this->position++;
 287              $this->state = self::STATE_BODY;
 288          } else {
 289              $this->state = self::STATE_NAME;
 290          }
 291      }
 292  
 293      /**
 294       * Parse a header name
 295       */
 296      protected function name()
 297      {
 298          $len = strcspn($this->data, "\x0A:", $this->position);
 299          if (isset($this->data[$this->position + $len])) {
 300              if ($this->data[$this->position + $len] === "\x0A") {
 301                  $this->position += $len;
 302                  $this->state = self::STATE_NEW_LINE;
 303              } else {
 304                  $this->name = substr($this->data, $this->position, $len);
 305                  $this->position += $len + 1;
 306                  $this->state = self::STATE_VALUE;
 307              }
 308          } else {
 309              $this->state = self::STATE_ERROR;
 310          }
 311      }
 312  
 313      /**
 314       * Parse LWS, replacing consecutive LWS characters with a single space
 315       */
 316      protected function linear_whitespace()
 317      {
 318          do {
 319              if (substr($this->data, $this->position, 2) === "\x0D\x0A") {
 320                  $this->position += 2;
 321              } elseif ($this->data[$this->position] === "\x0A") {
 322                  $this->position++;
 323              }
 324              $this->position += strspn($this->data, "\x09\x20", $this->position);
 325          } while ($this->has_data() && $this->is_linear_whitespace());
 326          $this->value .= "\x20";
 327      }
 328  
 329      /**
 330       * See what state to move to while within non-quoted header values
 331       */
 332      protected function value()
 333      {
 334          if ($this->is_linear_whitespace()) {
 335              $this->linear_whitespace();
 336          } else {
 337              switch ($this->data[$this->position]) {
 338                  case '"':
 339                      // Workaround for ETags: we have to include the quotes as
 340                      // part of the tag.
 341                      if (strtolower($this->name) === 'etag') {
 342                          $this->value .= '"';
 343                          $this->position++;
 344                          $this->state = self::STATE_VALUE_CHAR;
 345                          break;
 346                      }
 347                      $this->position++;
 348                      $this->state = self::STATE_QUOTE;
 349                      break;
 350  
 351                  case "\x0A":
 352                      $this->position++;
 353                      $this->state = self::STATE_NEW_LINE;
 354                      break;
 355  
 356                  default:
 357                      $this->state = self::STATE_VALUE_CHAR;
 358                      break;
 359              }
 360          }
 361      }
 362  
 363      /**
 364       * Parse a header value while outside quotes
 365       */
 366      protected function value_char()
 367      {
 368          $len = strcspn($this->data, "\x09\x20\x0A\"", $this->position);
 369          $this->value .= substr($this->data, $this->position, $len);
 370          $this->position += $len;
 371          $this->state = self::STATE_VALUE;
 372      }
 373  
 374      /**
 375       * See what state to move to while within quoted header values
 376       */
 377      protected function quote()
 378      {
 379          if ($this->is_linear_whitespace()) {
 380              $this->linear_whitespace();
 381          } else {
 382              switch ($this->data[$this->position]) {
 383                  case '"':
 384                      $this->position++;
 385                      $this->state = self::STATE_VALUE;
 386                      break;
 387  
 388                  case "\x0A":
 389                      $this->position++;
 390                      $this->state = self::STATE_NEW_LINE;
 391                      break;
 392  
 393                  case '\\':
 394                      $this->position++;
 395                      $this->state = self::STATE_QUOTE_ESCAPED;
 396                      break;
 397  
 398                  default:
 399                      $this->state = self::STATE_QUOTE_CHAR;
 400                      break;
 401              }
 402          }
 403      }
 404  
 405      /**
 406       * Parse a header value while within quotes
 407       */
 408      protected function quote_char()
 409      {
 410          $len = strcspn($this->data, "\x09\x20\x0A\"\\", $this->position);
 411          $this->value .= substr($this->data, $this->position, $len);
 412          $this->position += $len;
 413          $this->state = self::STATE_VALUE;
 414      }
 415  
 416      /**
 417       * Parse an escaped character within quotes
 418       */
 419      protected function quote_escaped()
 420      {
 421          $this->value .= $this->data[$this->position];
 422          $this->position++;
 423          $this->state = self::STATE_QUOTE;
 424      }
 425  
 426      /**
 427       * Parse the body
 428       */
 429      protected function body()
 430      {
 431          $this->body = substr($this->data, $this->position);
 432          if (!empty($this->headers['transfer-encoding'])) {
 433              unset($this->headers['transfer-encoding']);
 434              $this->state = self::STATE_CHUNKED;
 435          } else {
 436              $this->state = self::STATE_EMIT;
 437          }
 438      }
 439  
 440      /**
 441       * Parsed a "Transfer-Encoding: chunked" body
 442       */
 443      protected function chunked()
 444      {
 445          if (!preg_match('/^([0-9a-f]+)[^\r\n]*\r\n/i', trim($this->body))) {
 446              $this->state = self::STATE_EMIT;
 447              return;
 448          }
 449  
 450          $decoded = '';
 451          $encoded = $this->body;
 452  
 453          while (true) {
 454              $is_chunked = (bool) preg_match('/^([0-9a-f]+)[^\r\n]*\r\n/i', $encoded, $matches);
 455              if (!$is_chunked) {
 456                  // Looks like it's not chunked after all
 457                  $this->state = self::STATE_EMIT;
 458                  return;
 459              }
 460  
 461              $length = hexdec(trim($matches[1]));
 462              if ($length === 0) {
 463                  // Ignore trailer headers
 464                  $this->state = self::STATE_EMIT;
 465                  $this->body = $decoded;
 466                  return;
 467              }
 468  
 469              $chunk_length = strlen($matches[0]);
 470              $decoded .= substr($encoded, $chunk_length, $length);
 471              $encoded = substr($encoded, $chunk_length + $length + 2);
 472  
 473              // BC for PHP < 8.0: substr() can return bool instead of string
 474              $encoded = ($encoded === false) ? '' : $encoded;
 475  
 476              if (trim($encoded) === '0' || empty($encoded)) {
 477                  $this->state = self::STATE_EMIT;
 478                  $this->body = $decoded;
 479                  return;
 480              }
 481          }
 482      }
 483  
 484      /**
 485       * Prepare headers (take care of proxies headers)
 486       *
 487       * @param string  $headers Raw headers
 488       * @param integer $count   Redirection count. Default to 1.
 489       *
 490       * @return string
 491       */
 492      public static function prepareHeaders($headers, $count = 1)
 493      {
 494          $data = explode("\r\n\r\n", $headers, $count);
 495          $data = array_pop($data);
 496          if (false !== stripos($data, "HTTP/1.0 200 Connection established\r\n")) {
 497              $exploded = explode("\r\n\r\n", $data, 2);
 498              $data = end($exploded);
 499          }
 500          if (false !== stripos($data, "HTTP/1.1 200 Connection established\r\n")) {
 501              $exploded = explode("\r\n\r\n", $data, 2);
 502              $data = end($exploded);
 503          }
 504          return $data;
 505      }
 506  }
 507  
 508  class_alias('SimplePie\HTTP\Parser', 'SimplePie_HTTP_Parser');


Generated : Thu Nov 21 08:20:01 2024 Cross-referenced by PHPXref