[ Index ]

PHP Cross Reference of phpwcms V1.4.3 _r380 (23.11.09)

title

Body

[close]

/include/inc_ext/JSON/ -> JSON.php (source)

   1  <?php
   2  /* vim: set expandtab tabstop=4 shiftwidth=4 softtabstop=4: */
   3  
   4  /**
   5   * Converts to and from JSON format.
   6   *
   7   * JSON (JavaScript Object Notation) is a lightweight data-interchange
   8   * format. It is easy for humans to read and write. It is easy for machines
   9   * to parse and generate. It is based on a subset of the JavaScript
  10   * Programming Language, Standard ECMA-262 3rd Edition - December 1999.
  11   * This feature can also be found in  Python. JSON is a text format that is
  12   * completely language independent but uses conventions that are familiar
  13   * to programmers of the C-family of languages, including C, C++, C#, Java,
  14   * JavaScript, Perl, TCL, and many others. These properties make JSON an
  15   * ideal data-interchange language.
  16   *
  17   * This package provides a simple encoder and decoder for JSON notation. It
  18   * is intended for use with client-side Javascript applications that make
  19   * use of HTTPRequest to perform server communication functions - data can
  20   * be encoded into JSON notation for use in a client-side javascript, or
  21   * decoded from incoming Javascript requests. JSON format is native to
  22   * Javascript, and can be directly eval()'ed with no further parsing
  23   * overhead
  24   *
  25   * All strings should be in ASCII or UTF-8 format!
  26   *
  27   * LICENSE: Redistribution and use in source and binary forms, with or
  28   * without modification, are permitted provided that the following
  29   * conditions are met: Redistributions of source code must retain the
  30   * above copyright notice, this list of conditions and the following
  31   * disclaimer. Redistributions in binary form must reproduce the above
  32   * copyright notice, this list of conditions and the following disclaimer
  33   * in the documentation and/or other materials provided with the
  34   * distribution.
  35   *
  36   * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
  37   * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
  38   * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN
  39   * NO EVENT SHALL CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  40   * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
  41   * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
  42   * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
  43   * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR
  44   * TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE
  45   * USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
  46   * DAMAGE.
  47   *
  48   * @category
  49   * @package     Services_JSON
  50   * @author      Michal Migurski <mike-json@teczno.com>
  51   * @author      Matt Knapp <mdknapp[at]gmail[dot]com>
  52   * @author      Brett Stimmerman <brettstimmerman[at]gmail[dot]com>
  53   * @copyright   2005 Michal Migurski
  54   * @version     CVS: $Id: JSON.php,v 1.31 2006/06/28 05:54:17 migurski Exp $
  55   * @license     http://www.opensource.org/licenses/bsd-license.php
  56   * @link        http://pear.php.net/pepr/pepr-proposal-show.php?id=198
  57   */
  58  
   59  /**
   60   * Stack marker for Services_JSON::decode(): entry recording where the current comma-separated slice starts
   61   */
   62  define('SERVICES_JSON_SLICE',   1);
   63  
   64  /**
   65   * Stack marker for Services_JSON::decode(): inside a quoted string (the entry records its delimiter)
   66   */
   67  define('SERVICES_JSON_IN_STR',  2);
   68  
   69  /**
   70   * Stack marker for Services_JSON::decode(): bottom of the stack while parsing "[...]" array notation
   71   */
   72  define('SERVICES_JSON_IN_ARR',  3);
   73  
   74  /**
   75   * Stack marker for Services_JSON::decode(): bottom of the stack while parsing "{...}" object notation
   76   */
   77  define('SERVICES_JSON_IN_OBJ',  4);
   78  
   79  /**
   80   * Stack marker for Services_JSON::decode(); presumably "inside a comment" - its use is not visible here, verify
   81   */
   82  define('SERVICES_JSON_IN_CMT', 5);
   83  
   84  /**
   85   * Behavior switch for Services_JSON::decode(): "{...}" decodes to an associative array instead of stdClass
   86   */
   87  define('SERVICES_JSON_LOOSE_TYPE', 16);
   88  
   89  /**
   90   * Behavior switch for Services_JSON::encode(): unencodable values become 'null' instead of an error object
   91   */
   92  define('SERVICES_JSON_SUPPRESS_ERRORS', 32);
  93  
  94  /**
  95   * Converts to and from JSON format.
  96   *
  97   * Brief example of use:
  98   *
  99   * <code>
 100   * // create a new instance of Services_JSON
 101   * $json = new Services_JSON();
 102   *
  103   * // convert a complex value to JSON notation, and send it to the browser
 104   * $value = array('foo', 'bar', array(1, 2, 'baz'), array(3, array(4)));
 105   * $output = $json->encode($value);
 106   *
 107   * print($output);
 108   * // prints: ["foo","bar",[1,2,"baz"],[3,[4]]]
 109   *
 110   * // accept incoming POST data, assumed to be in JSON notation
 111   * $input = file_get_contents('php://input', 1000000);
 112   * $value = $json->decode($input);
 113   * </code>
 114   */
 115  class Services_JSON
 116  {
 117     /**
 118      * constructs a new JSON instance
 119      *
 120      * @param    int     $use    object behavior flags; combine with boolean-OR
 121      *
 122      *                           possible values:
 123      *                           - SERVICES_JSON_LOOSE_TYPE:  loose typing.
 124      *                                   "{...}" syntax creates associative arrays
 125      *                                   instead of objects in decode().
 126      *                           - SERVICES_JSON_SUPPRESS_ERRORS:  error suppression.
 127      *                                   Values which can't be encoded (e.g. resources)
 128      *                                   appear as NULL instead of throwing errors.
 129      *                                   By default, a deeply-nested resource will
 130      *                                   bubble up with an error, so all return values
 131      *                                   from encode() should be checked with isError()
 132      */
 133      function Services_JSON($use = 0)
 134      {
 135          $this->use = $use;
 136      }
 137  
 138     /**
 139      * convert a string from one UTF-16 char to one UTF-8 char
 140      *
 141      * Normally should be handled by mb_convert_encoding, but
 142      * provides a slower PHP-only method for installations
 143      * that lack the multibye string extension.
 144      *
 145      * @param    string  $utf16  UTF-16 character
 146      * @return   string  UTF-8 character
 147      * @access   private
 148      */
 149      function utf162utf8($utf16)
 150      {
 151          // oh please oh please oh please oh please oh please
 152          if(function_exists('mb_convert_encoding')) {
 153              return mb_convert_encoding($utf16, 'UTF-8', 'UTF-16');
 154          }
 155  
 156          $bytes = (ord($utf16{0}) << 8) | ord($utf16{1});
 157  
 158          switch(true) {
 159              case ((0x7F & $bytes) == $bytes):
 160                  // this case should never be reached, because we are in ASCII range
 161                  // see: http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 162                  return chr(0x7F & $bytes);
 163  
 164              case (0x07FF & $bytes) == $bytes:
 165                  // return a 2-byte UTF-8 character
 166                  // see: http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 167                  return chr(0xC0 | (($bytes >> 6) & 0x1F))
 168                       . chr(0x80 | ($bytes & 0x3F));
 169  
 170              case (0xFFFF & $bytes) == $bytes:
 171                  // return a 3-byte UTF-8 character
 172                  // see: http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 173                  return chr(0xE0 | (($bytes >> 12) & 0x0F))
 174                       . chr(0x80 | (($bytes >> 6) & 0x3F))
 175                       . chr(0x80 | ($bytes & 0x3F));
 176          }
 177  
 178          // ignoring UTF-32 for now, sorry
 179          return '';
 180      }
 181  
 182     /**
 183      * convert a string from one UTF-8 char to one UTF-16 char
 184      *
 185      * Normally should be handled by mb_convert_encoding, but
 186      * provides a slower PHP-only method for installations
 187      * that lack the multibye string extension.
 188      *
 189      * @param    string  $utf8   UTF-8 character
 190      * @return   string  UTF-16 character
 191      * @access   private
 192      */
 193      function utf82utf16($utf8)
 194      {
 195          // oh please oh please oh please oh please oh please
 196          if(function_exists('mb_convert_encoding')) {
 197              return mb_convert_encoding($utf8, 'UTF-16', 'UTF-8');
 198          }
 199  
 200          switch(strlen($utf8)) {
 201              case 1:
 202                  // this case should never be reached, because we are in ASCII range
 203                  // see: http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 204                  return $utf8;
 205  
 206              case 2:
 207                  // return a UTF-16 character from a 2-byte UTF-8 char
 208                  // see: http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 209                  return chr(0x07 & (ord($utf8{0}) >> 2))
 210                       . chr((0xC0 & (ord($utf8{0}) << 6))
 211                           | (0x3F & ord($utf8{1})));
 212  
 213              case 3:
 214                  // return a UTF-16 character from a 3-byte UTF-8 char
 215                  // see: http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 216                  return chr((0xF0 & (ord($utf8{0}) << 4))
 217                           | (0x0F & (ord($utf8{1}) >> 2)))
 218                       . chr((0xC0 & (ord($utf8{1}) << 6))
 219                           | (0x7F & ord($utf8{2})));
 220          }
 221  
 222          // ignoring UTF-32 for now, sorry
 223          return '';
 224      }
 225  
 226     /**
 227      * encodes an arbitrary variable into JSON format
 228      *
 229      * @param    mixed   $var    any number, boolean, string, array, or object to be encoded.
 230      *                           see argument 1 to Services_JSON() above for array-parsing behavior.
 231      *                           if var is a strng, note that encode() always expects it
 232      *                           to be in ASCII or UTF-8 format!
 233      *
 234      * @return   mixed   JSON string representation of input var or an error if a problem occurs
 235      * @access   public
 236      */
 237      function encode($var)
 238      {
 239          switch (gettype($var)) {
 240              case 'boolean':
 241                  return $var ? 'true' : 'false';
 242  
 243              case 'NULL':
 244                  return 'null';
 245  
 246              case 'integer':
 247                  return (int) $var;
 248  
 249              case 'double':
 250              case 'float':
 251                  return (float) $var;
 252  
 253              case 'string':
 254                  // STRINGS ARE EXPECTED TO BE IN ASCII OR UTF-8 FORMAT
 255                  $ascii = '';
 256                  $strlen_var = strlen($var);
 257  
 258                 /*
 259                  * Iterate over every character in the string,
 260                  * escaping with a slash or encoding to UTF-8 where necessary
 261                  */
 262                  for ($c = 0; $c < $strlen_var; ++$c) {
 263  
 264                      $ord_var_c = ord($var{$c});
 265  
 266                      switch (true) {
 267                          case $ord_var_c == 0x08:
 268                              $ascii .= '\b';
 269                              break;
 270                          case $ord_var_c == 0x09:
 271                              $ascii .= '\t';
 272                              break;
 273                          case $ord_var_c == 0x0A:
 274                              $ascii .= '\n';
 275                              break;
 276                          case $ord_var_c == 0x0C:
 277                              $ascii .= '\f';
 278                              break;
 279                          case $ord_var_c == 0x0D:
 280                              $ascii .= '\r';
 281                              break;
 282  
 283                          case $ord_var_c == 0x22:
 284                          case $ord_var_c == 0x2F:
 285                          case $ord_var_c == 0x5C:
 286                              // double quote, slash, slosh
 287                              $ascii .= '\\'.$var{$c};
 288                              break;
 289  
 290                          case (($ord_var_c >= 0x20) && ($ord_var_c <= 0x7F)):
 291                              // characters U-00000000 - U-0000007F (same as ASCII)
 292                              $ascii .= $var{$c};
 293                              break;
 294  
 295                          case (($ord_var_c & 0xE0) == 0xC0):
 296                              // characters U-00000080 - U-000007FF, mask 110XXXXX
 297                              // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 298                              $char = pack('C*', $ord_var_c, ord($var{$c + 1}));
 299                              $c += 1;
 300                              $utf16 = $this->utf82utf16($char);
 301                              $ascii .= sprintf('\u%04s', bin2hex($utf16));
 302                              break;
 303  
 304                          case (($ord_var_c & 0xF0) == 0xE0):
 305                              // characters U-00000800 - U-0000FFFF, mask 1110XXXX
 306                              // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 307                              $char = pack('C*', $ord_var_c,
 308                                           ord($var{$c + 1}),
 309                                           ord($var{$c + 2}));
 310                              $c += 2;
 311                              $utf16 = $this->utf82utf16($char);
 312                              $ascii .= sprintf('\u%04s', bin2hex($utf16));
 313                              break;
 314  
 315                          case (($ord_var_c & 0xF8) == 0xF0):
 316                              // characters U-00010000 - U-001FFFFF, mask 11110XXX
 317                              // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 318                              $char = pack('C*', $ord_var_c,
 319                                           ord($var{$c + 1}),
 320                                           ord($var{$c + 2}),
 321                                           ord($var{$c + 3}));
 322                              $c += 3;
 323                              $utf16 = $this->utf82utf16($char);
 324                              $ascii .= sprintf('\u%04s', bin2hex($utf16));
 325                              break;
 326  
 327                          case (($ord_var_c & 0xFC) == 0xF8):
 328                              // characters U-00200000 - U-03FFFFFF, mask 111110XX
 329                              // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 330                              $char = pack('C*', $ord_var_c,
 331                                           ord($var{$c + 1}),
 332                                           ord($var{$c + 2}),
 333                                           ord($var{$c + 3}),
 334                                           ord($var{$c + 4}));
 335                              $c += 4;
 336                              $utf16 = $this->utf82utf16($char);
 337                              $ascii .= sprintf('\u%04s', bin2hex($utf16));
 338                              break;
 339  
 340                          case (($ord_var_c & 0xFE) == 0xFC):
 341                              // characters U-04000000 - U-7FFFFFFF, mask 1111110X
 342                              // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 343                              $char = pack('C*', $ord_var_c,
 344                                           ord($var{$c + 1}),
 345                                           ord($var{$c + 2}),
 346                                           ord($var{$c + 3}),
 347                                           ord($var{$c + 4}),
 348                                           ord($var{$c + 5}));
 349                              $c += 5;
 350                              $utf16 = $this->utf82utf16($char);
 351                              $ascii .= sprintf('\u%04s', bin2hex($utf16));
 352                              break;
 353                      }
 354                  }
 355  
 356                  return '"'.$ascii.'"';
 357  
 358              case 'array':
 359                 /*
 360                  * As per JSON spec if any array key is not an integer
 361                  * we must treat the the whole array as an object. We
 362                  * also try to catch a sparsely populated associative
 363                  * array with numeric keys here because some JS engines
 364                  * will create an array with empty indexes up to
 365                  * max_index which can cause memory issues and because
 366                  * the keys, which may be relevant, will be remapped
 367                  * otherwise.
 368                  *
 369                  * As per the ECMA and JSON specification an object may
 370                  * have any string as a property. Unfortunately due to
 371                  * a hole in the ECMA specification if the key is a
 372                  * ECMA reserved word or starts with a digit the
 373                  * parameter is only accessible using ECMAScript's
 374                  * bracket notation.
 375                  */
 376  
 377                  // treat as a JSON object
 378                  if (is_array($var) && count($var) && (array_keys($var) !== range(0, sizeof($var) - 1))) {
 379                      $properties = array_map(array($this, 'name_value'),
 380                                              array_keys($var),
 381                                              array_values($var));
 382  
 383                      foreach($properties as $property) {
 384                          if(Services_JSON::isError($property)) {
 385                              return $property;
 386                          }
 387                      }
 388  
 389                      return '{' . join(',', $properties) . '}';
 390                  }
 391  
 392                  // treat it like a regular array
 393                  $elements = array_map(array($this, 'encode'), $var);
 394  
 395                  foreach($elements as $element) {
 396                      if(Services_JSON::isError($element)) {
 397                          return $element;
 398                      }
 399                  }
 400  
 401                  return '[' . join(',', $elements) . ']';
 402  
 403              case 'object':
 404                  $vars = get_object_vars($var);
 405  
 406                  $properties = array_map(array($this, 'name_value'),
 407                                          array_keys($vars),
 408                                          array_values($vars));
 409  
 410                  foreach($properties as $property) {
 411                      if(Services_JSON::isError($property)) {
 412                          return $property;
 413                      }
 414                  }
 415  
 416                  return '{' . join(',', $properties) . '}';
 417  
 418              default:
 419                  return ($this->use & SERVICES_JSON_SUPPRESS_ERRORS)
 420                      ? 'null'
 421                      : new Services_JSON_Error(gettype($var)." can not be encoded as JSON string");
 422          }
 423      }
 424  
 425     /**
 426      * array-walking function for use in generating JSON-formatted name-value pairs
 427      *
 428      * @param    string  $name   name of key to use
 429      * @param    mixed   $value  reference to an array element to be encoded
 430      *
 431      * @return   string  JSON-formatted name-value pair, like '"name":value'
 432      * @access   private
 433      */
 434      function name_value($name, $value)
 435      {
 436          $encoded_value = $this->encode($value);
 437  
 438          if(Services_JSON::isError($encoded_value)) {
 439              return $encoded_value;
 440          }
 441  
 442          return $this->encode(strval($name)) . ':' . $encoded_value;
 443      }
 444  
 445     /**
 446      * reduce a string by removing leading and trailing comments and whitespace
 447      *
 448      * @param    $str    string      string value to strip of comments and whitespace
 449      *
 450      * @return   string  string value stripped of comments and whitespace
 451      * @access   private
 452      */
 453      function reduce_string($str)
 454      {
 455          $str = preg_replace(array(
 456  
 457                  // eliminate single line comments in '// ...' form
 458                  '#^\s*//(.+)$#m',
 459  
 460                  // eliminate multi-line comments in '/* ... */' form, at start of string
 461                  '#^\s*/\*(.+)\*/#Us',
 462  
 463                  // eliminate multi-line comments in '/* ... */' form, at end of string
 464                  '#/\*(.+)\*/\s*$#Us'
 465  
 466              ), '', $str);
 467  
 468          // eliminate extraneous space
 469          return trim($str);
 470      }
 471  
 472     /**
 473      * decodes a JSON string into appropriate variable
 474      *
 475      * @param    string  $str    JSON-formatted string
 476      *
 477      * @return   mixed   number, boolean, string, array, or object
 478      *                   corresponding to given JSON input string.
 479      *                   See argument 1 to Services_JSON() above for object-output behavior.
 480      *                   Note that decode() always returns strings
 481      *                   in ASCII or UTF-8 format!
 482      * @access   public
 483      */
 484      function decode($str)
 485      {
 486          $str = $this->reduce_string($str);
 487  
 488          switch (strtolower($str)) {
 489              case 'true':
 490                  return true;
 491  
 492              case 'false':
 493                  return false;
 494  
 495              case 'null':
 496                  return null;
 497  
 498              default:
 499                  $m = array();
 500  
 501                  if (is_numeric($str)) {
 502                      // Lookie-loo, it's a number
 503  
 504                      // This would work on its own, but I'm trying to be
 505                      // good about returning integers where appropriate:
 506                      // return (float)$str;
 507  
 508                      // Return float or int, as appropriate
 509                      return ((float)$str == (integer)$str)
 510                          ? (integer)$str
 511                          : (float)$str;
 512  
 513                  } elseif (preg_match('/^("|\').*(\1)$/s', $str, $m) && $m[1] == $m[2]) {
 514                      // STRINGS RETURNED IN UTF-8 FORMAT
 515                      $delim = substr($str, 0, 1);
 516                      $chrs = substr($str, 1, -1);
 517                      $utf8 = '';
 518                      $strlen_chrs = strlen($chrs);
 519  
 520                      for ($c = 0; $c < $strlen_chrs; ++$c) {
 521  
 522                          $substr_chrs_c_2 = substr($chrs, $c, 2);
 523                          $ord_chrs_c = ord($chrs{$c});
 524  
 525                          switch (true) {
 526                              case $substr_chrs_c_2 == '\b':
 527                                  $utf8 .= chr(0x08);
 528                                  ++$c;
 529                                  break;
 530                              case $substr_chrs_c_2 == '\t':
 531                                  $utf8 .= chr(0x09);
 532                                  ++$c;
 533                                  break;
 534                              case $substr_chrs_c_2 == '\n':
 535                                  $utf8 .= chr(0x0A);
 536                                  ++$c;
 537                                  break;
 538                              case $substr_chrs_c_2 == '\f':
 539                                  $utf8 .= chr(0x0C);
 540                                  ++$c;
 541                                  break;
 542                              case $substr_chrs_c_2 == '\r':
 543                                  $utf8 .= chr(0x0D);
 544                                  ++$c;
 545                                  break;
 546  
 547                              case $substr_chrs_c_2 == '\\"':
 548                              case $substr_chrs_c_2 == '\\\'':
 549                              case $substr_chrs_c_2 == '\\\\':
 550                              case $substr_chrs_c_2 == '\\/':
 551                                  if (($delim == '"' && $substr_chrs_c_2 != '\\\'') ||
 552                                     ($delim == "'" && $substr_chrs_c_2 != '\\"')) {
 553                                      $utf8 .= $chrs{++$c};
 554                                  }
 555                                  break;
 556  
 557                              case preg_match('/\\\u[0-9A-F]{4}/i', substr($chrs, $c, 6)):
 558                                  // single, escaped unicode character
 559                                  $utf16 = chr(hexdec(substr($chrs, ($c + 2), 2)))
 560                                         . chr(hexdec(substr($chrs, ($c + 4), 2)));
 561                                  $utf8 .= $this->utf162utf8($utf16);
 562                                  $c += 5;
 563                                  break;
 564  
 565                              case ($ord_chrs_c >= 0x20) && ($ord_chrs_c <= 0x7F):
 566                                  $utf8 .= $chrs{$c};
 567                                  break;
 568  
 569                              case ($ord_chrs_c & 0xE0) == 0xC0:
 570                                  // characters U-00000080 - U-000007FF, mask 110XXXXX
 571                                  //see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 572                                  $utf8 .= substr($chrs, $c, 2);
 573                                  ++$c;
 574                                  break;
 575  
 576                              case ($ord_chrs_c & 0xF0) == 0xE0:
 577                                  // characters U-00000800 - U-0000FFFF, mask 1110XXXX
 578                                  // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 579                                  $utf8 .= substr($chrs, $c, 3);
 580                                  $c += 2;
 581                                  break;
 582  
 583                              case ($ord_chrs_c & 0xF8) == 0xF0:
 584                                  // characters U-00010000 - U-001FFFFF, mask 11110XXX
 585                                  // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 586                                  $utf8 .= substr($chrs, $c, 4);
 587                                  $c += 3;
 588                                  break;
 589  
 590                              case ($ord_chrs_c & 0xFC) == 0xF8:
 591                                  // characters U-00200000 - U-03FFFFFF, mask 111110XX
 592                                  // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 593                                  $utf8 .= substr($chrs, $c, 5);
 594                                  $c += 4;
 595                                  break;
 596  
 597                              case ($ord_chrs_c & 0xFE) == 0xFC:
 598                                  // characters U-04000000 - U-7FFFFFFF, mask 1111110X
 599                                  // see http://www.cl.cam.ac.uk/~mgk25/unicode.html#utf-8
 600                                  $utf8 .= substr($chrs, $c, 6);
 601                                  $c += 5;
 602                                  break;
 603  
 604                          }
 605  
 606                      }
 607  
 608                      return $utf8;
 609  
 610                  } elseif (preg_match('/^\[.*\]$/s', $str) || preg_match('/^\{.*\}$/s', $str)) {
 611                      // array, or object notation
 612  
 613                      if ($str{0} == '[') {
 614                          $stk = array(SERVICES_JSON_IN_ARR);
 615                          $arr = array();
 616                      } else {
 617                          if ($this->use & SERVICES_JSON_LOOSE_TYPE) {
 618                              $stk = array(SERVICES_JSON_IN_OBJ);
 619                              $obj = array();
 620                          } else {
 621                              $stk = array(SERVICES_JSON_IN_OBJ);
 622                              $obj = new stdClass();
 623                          }
 624                      }
 625  
 626                      array_push($stk, array('what'  => SERVICES_JSON_SLICE,
 627                                             'where' => 0,
 628                                             'delim' => false));
 629  
 630                      $chrs = substr($str, 1, -1);
 631                      $chrs = $this->reduce_string($chrs);
 632  
 633                      if ($chrs == '') {
 634                          if (reset($stk) == SERVICES_JSON_IN_ARR) {
 635                              return $arr;
 636  
 637                          } else {
 638                              return $obj;
 639  
 640                          }
 641                      }
 642  
 643                      //print("\nparsing {$chrs}\n");
 644  
 645                      $strlen_chrs = strlen($chrs);
 646  
 647                      for ($c = 0; $c <= $strlen_chrs; ++$c) {
 648  
 649                          $top = end($stk);
 650                          $substr_chrs_c_2 = substr($chrs, $c, 2);
 651  
 652                          if (($c == $strlen_chrs) || (($chrs{$c} == ',') && ($top['what'] == SERVICES_JSON_SLICE))) {
 653                              // found a comma that is not inside a string, array, etc.,
 654                              // OR we've reached the end of the character list
 655                              $slice = substr($chrs, $top['where'], ($c - $top['where']));
 656                              array_push($stk, array('what' => SERVICES_JSON_SLICE, 'where' => ($c + 1), 'delim' => false));
 657                              //print("Found split at {$c}: ".substr($chrs, $top['where'], (1 + $c - $top['where']))."\n");
 658  
 659                              if (reset($stk) == SERVICES_JSON_IN_ARR) {
 660                                  // we are in an array, so just push an element onto the stack
 661                                  array_push($arr, $this->decode($slice));
 662  
 663                              } elseif (reset($stk) == SERVICES_JSON_IN_OBJ) {
 664                                  // we are in an object, so figure
 665                                  // out the property name and set an
 666                                  // element in an associative array,
 667                                  // for now
 668                                  $parts = array();
 669                                  
 670                                  if (preg_match('/^\s*(["\'].*[^\\\]["\'])\s*:\s*(\S.*),?$/Uis', $slice, $parts)) {
 671                                      // "name":value pair
 672                                      $key = $this->decode($parts[1]);
 673                                      $val = $this->decode($parts[2]);
 674  
 675                                      if ($this->use & SERVICES_JSON_LOOSE_TYPE) {
 676                                          $obj[$key] = $val;
 677                                      } else {
 678                                          $obj->$key = $val;
 679                                      }
 680                                  } elseif (preg_match('/^\s*(\w+)\s*:\s*(\S.*),?$/Uis', $slice, $parts)) {
 681                                      // name:value pair, where name is unquoted
 682                                      $key = $parts[1];
 683                                      $val = $this->decode($parts[2]);
 684  
 685                                      if ($this->use & SERVICES_JSON_LOOSE_TYPE) {
 686                                          $obj[$key] = $val;
 687                                      } else {
 688                                          $obj->$key = $val;
 689                                      }
 690                                  }
 691  
 692                              }
 693  
 694                          } elseif ((($chrs{$c} == '"') || ($chrs{$c} == "'")) && ($top['what'] != SERVICES_JSON_IN_STR)) {
 695                              // found a quote, and we are not inside a string
 696                              array_push($stk, array('what' => SERVICES_JSON_IN_STR, 'where' => $c, 'delim' => $chrs{$c}));
 697                              //print("Found start of string at {$c}\n");
 698  
 699                          } elseif (($chrs{$c} == $top['delim']) &&
 700                                   ($top['what'] == SERVICES_JSON_IN_STR) &&
 701                                   ((strlen(substr($chrs, 0, $c)) - strlen(rtrim(substr($chrs, 0, $c), '\\'))) % 2 != 1)) {
 702                              // found a quote, we're in a string, and it's not escaped
 703                              // we know that it's not escaped because there is _not_ an
 704                              // odd number of backslashes at the end of the string so far
 705                              array_pop($stk);
 706                              //print("Found end of string at {$c}: ".substr($chrs, $top['where'], (1 + 1 + $c - $top['where']))."\n");
 707  
 708                          } elseif (($chrs{$c} == '[') &&
 709                                   in_array($top['what'], array(SERVICES_JSON_SLICE, SERVICES_JSON_IN_ARR, SERVICES_JSON_IN_OBJ))) {
 710                              // found a left-bracket, and we are in an array, object, or slice
 711                              array_push($stk, array('what' => SERVICES_JSON_IN_ARR, 'where' => $c, 'delim' => false));
 712                              //print("Found start of array at {$c}\n");
 713  
 714                          } elseif (($chrs{$c} == ']') && ($top['what'] == SERVICES_JSON_IN_ARR)) {
 715                              // found a right-bracket, and we're in an array
 716                              array_pop($stk);
 717                              //print("Found end of array at {$c}: ".substr($chrs, $top['where'], (1 + $c - $top['where']))."\n");
 718  
 719                          } elseif (($chrs{$c} == '{') &&
 720                                   in_array($top['what'], array(SERVICES_JSON_SLICE, SERVICES_JSON_IN_ARR, SERVICES_JSON_IN_OBJ))) {
 721                              // found a left-brace, and we are in an array, object, or slice
 722                              array_push($stk, array('what' => SERVICES_JSON_IN_OBJ, 'where' => $c, 'delim' => false));
 723                              //print("Found start of object at {$c}\n");
 724  
 725                          } elseif (($chrs{$c} == '}') && ($top['what'] == SERVICES_JSON_IN_OBJ)) {
 726                              // found a right-brace, and we're in an object
 727                              array_pop($stk);
 728                              //print("Found end of object at {$c}: ".substr($chrs, $top['where'], (1 + $c - $top['where']))."\n");
 729  
 730                          } elseif (($substr_chrs_c_2 == '/*') &&
 731                                   in_array($top['what'], array(SERVICES_JSON_SLICE, SERVICES_JSON_IN_ARR, SERVICES_JSON_IN_OBJ))) {
 732                              // found a comment start, and we are in an array, object, or slice
 733                              array_push($stk, array('what' => SERVICES_JSON_IN_CMT, 'where' => $c, 'delim' => false));
 734                              $c++;
 735                              //print("Found start of comment at {$c}\n");
 736  
 737                          } elseif (($substr_chrs_c_2 == '*/') && ($top['what'] == SERVICES_JSON_IN_CMT)) {
 738                              // found a comment end, and we're in one now
 739                              array_pop($stk);
 740                              $c++;
 741  
 742                              for ($i = $top['where']; $i <= $c; ++$i)
 743                                  $chrs = substr_replace($chrs, ' ', $i, 1);
 744  
 745                              //print("Found end of comment at {$c}: ".substr($chrs, $top['where'], (1 + $c - $top['where']))."\n");
 746  
 747                          }
 748  
 749                      }
 750  
 751                      if (reset($stk) == SERVICES_JSON_IN_ARR) {
 752                          return $arr;
 753  
 754                      } elseif (reset($stk) == SERVICES_JSON_IN_OBJ) {
 755                          return $obj;
 756  
 757                      }
 758  
 759                  }
 760          }
 761      }
 762  
 763      /**
 764       * @todo Ultimately, this should just call PEAR::isError()
 765       */
 766      function isError($data, $code = null)
 767      {
 768          if (class_exists('pear')) {
 769              return PEAR::isError($data, $code);
 770          } elseif (is_object($data) && (get_class($data) == 'services_json_error' ||
 771                                   is_subclass_of($data, 'services_json_error'))) {
 772              return true;
 773          }
 774  
 775          return false;
 776      }
 777  }
 778  
 779  if (class_exists('PEAR_Error')) {
 780  
 781      class Services_JSON_Error extends PEAR_Error
 782      {
 783          function Services_JSON_Error($message = 'unknown error', $code = null,
 784                                       $mode = null, $options = null, $userinfo = null)
 785          {
 786              parent::PEAR_Error($message, $code, $mode, $options, $userinfo);
 787          }
 788      }
 789  
 790  } else {
 791  
 792      /**
 793       * @todo Ultimately, this class shall be descended from PEAR_Error
 794       */
 795      class Services_JSON_Error
 796      {
 797          function Services_JSON_Error($message = 'unknown error', $code = null,
 798                                       $mode = null, $options = null, $userinfo = null)
 799          {
 800  
 801          }
 802      }
 803  
 804  }
 805      
 806  ?>


Generated: Wed Dec 30 05:55:15 2009 Cross-referenced by PHPXref 0.7