<?php /** * Zend Framework * * LICENSE * * This source file is subject to the new BSD license that is bundled * with this package in the file LICENSE.txt. * It is also available through the world-wide-web at this URL: * http://framework.zend.com/license/new-bsd * If you did not receive a copy of the license and are unable to * obtain it through the world-wide-web, please send an email * to license@zend.com so we can send you a copy immediately. * * @category Zend * @package Zend_Serializer * @subpackage Adapter * @copyright Copyright (c) 2005-2014 Zend Technologies USA Inc. (http://www.zend.com) * @license http://framework.zend.com/license/new-bsd New BSD License * @version $Id$ */ /** @see Zend_Serializer_Adapter_AdapterAbstract */ require_once 'Zend/Serializer/Adapter/AdapterAbstract.php'; /** * @link http://www.python.org * @see Phython3.1/Lib/pickle.py * @see Phython3.1/Modules/_pickle.c * @link http://pickle-js.googlecode.com * @category Zend * @package Zend_Serializer * @subpackage Adapter * @copyright Copyright (c) 2005-2014 Zend Technologies USA Inc. (http://www.zend.com) * @license http://framework.zend.com/license/new-bsd New BSD License */ class Zend_Serializer_Adapter_PythonPickle extends Zend_Serializer_Adapter_AdapterAbstract { /* Pickle opcodes. See pickletools.py for extensive docs. The listing here is in kind-of alphabetical order of 1-character pickle code. pickletools groups them by purpose. */ const OP_MARK = '('; // push special markobject on stack const OP_STOP = '.'; // every pickle ends with STOP const OP_POP = '0'; // discard topmost stack item const OP_POP_MARK = '1'; // discard stack top through topmost markobject const OP_DUP = '2'; // duplicate top stack item const OP_FLOAT = 'F'; // push float object; decimal string argument const OP_INT = 'I'; // push integer or bool; decimal string argument const OP_BININT = 'J'; // push four-byte signed int const OP_BININT1 = 'K'; // push 1-byte unsigned int const OP_LONG = 'L'; // push long; decimal string argument const OP_BININT2 = 'M'; // push 2-byte unsigned int const OP_NONE = 'N'; // push None const OP_PERSID = 'P'; // push persistent object; id is taken from string arg const OP_BINPERSID = 'Q'; // " " " ; " " " " stack const OP_REDUCE = 'R'; // apply callable to argtuple, both on stack const OP_STRING = 'S'; // push string; NL-terminated string argument const OP_BINSTRING = 'T'; // push string; counted binary string argument const OP_SHORT_BINSTRING = 'U'; // " " ; " " " " < 256 bytes const OP_UNICODE = 'V'; // push Unicode string; raw-unicode-escaped'd argument const OP_BINUNICODE = 'X'; // " " " ; counted UTF-8 string argument const OP_APPEND = 'a'; // append stack top to list below it const OP_BUILD = 'b'; // call __setstate__ or __dict__.update() const OP_GLOBAL = 'c'; // push self.find_class(modname, name); 2 string args const OP_DICT = 'd'; // build a dict from stack items const OP_EMPTY_DICT = '}'; // push empty dict const OP_APPENDS = 'e'; // extend list on stack by topmost stack slice const OP_GET = 'g'; // push item from memo on stack; index is string arg const OP_BINGET = 'h'; // " " " " " " ; " " 1-byte arg const OP_INST = 'i'; // build & push class instance const OP_LONG_BINGET = 'j'; // push item from memo on stack; index is 4-byte arg const OP_LIST = 'l'; // build list from topmost stack items const OP_EMPTY_LIST = ']'; // push empty list const OP_OBJ = 'o'; // build & push class instance const OP_PUT = 'p'; // store stack top in memo; index is string arg const OP_BINPUT = 'q'; // " " " " " ; " " 1-byte arg const OP_LONG_BINPUT = 'r'; // " " " " " ; " " 4-byte arg const OP_SETITEM = 's'; // add key+value pair to dict const OP_TUPLE = 't'; // build tuple from topmost stack items const OP_EMPTY_TUPLE = ')'; // push empty tuple const OP_SETITEMS = 'u'; // modify dict by adding topmost key+value pairs const OP_BINFLOAT = 'G'; // push float; arg is 8-byte float encoding /* Protocol 2 */ const OP_PROTO = "\x80"; // identify pickle protocol const OP_NEWOBJ = "\x81"; // build object by applying cls.__new__ to argtuple const OP_EXT1 = "\x82"; // push object from extension registry; 1-byte index const OP_EXT2 = "\x83"; // ditto, but 2-byte index const OP_EXT4 = "\x84"; // ditto, but 4-byte index const OP_TUPLE1 = "\x85"; // build 1-tuple from stack top const OP_TUPLE2 = "\x86"; // build 2-tuple from two topmost stack items const OP_TUPLE3 = "\x87"; // build 3-tuple from three topmost stack items const OP_NEWTRUE = "\x88"; // push True const OP_NEWFALSE = "\x89"; // push False const OP_LONG1 = "\x8a"; // push long from < 256 bytes const OP_LONG4 = "\x8b"; // push really big long /* Protocol 3 (Python 3.x) */ const OP_BINBYTES = 'B'; // push bytes; counted binary string argument const OP_SHORT_BINBYTES = 'C'; // " " ; " " " " < 256 bytes /** * @var bool Whether or not this is a PHP 6 binary */ protected static $_isPhp6 = null; /** * @var bool Whether or not the system is little-endian */ protected static $_isLittleEndian = null; /** * @var array Strings representing quotes */ protected static $_quoteString = array( '\\' => '\\\\', "\x00" => '\\x00', "\x01" => '\\x01', "\x02" => '\\x02', "\x03" => '\\x03', "\x04" => '\\x04', "\x05" => '\\x05', "\x06" => '\\x06', "\x07" => '\\x07', "\x08" => '\\x08', "\x09" => '\\t', "\x0a" => '\\n', "\x0b" => '\\x0b', "\x0c" => '\\x0c', "\x0d" => '\\r', "\x0e" => '\\x0e', "\x0f" => '\\x0f', "\x10" => '\\x10', "\x11" => '\\x11', "\x12" => '\\x12', "\x13" => '\\x13', "\x14" => '\\x14', "\x15" => '\\x15', "\x16" => '\\x16', "\x17" => '\\x17', "\x18" => '\\x18', "\x19" => '\\x19', "\x1a" => '\\x1a', "\x1b" => '\\x1b', "\x1c" => '\\x1c', "\x1d" => '\\x1d', "\x1e" => '\\x1e', "\x1f" => '\\x1f', "\xff" => '\\xff' ); /** * @var array Default options */ protected $_options = array( 'protocol' => 0, ); // process vars protected $_protocol = 0; protected $_binary = false; protected $_memo = array(); protected $_pickle = ''; protected $_pickleLen = 0; protected $_pos = 0; protected $_stack = array(); protected $_marker = null; /** * Constructor * * @link Zend_Serializer_Adapter_AdapterAbstract::__construct() */ public function __construct($opts=array()) { parent::__construct($opts); // init if (self::$_isLittleEndian === null) { self::$_isLittleEndian = (pack('l', 1) === "\x01\x00\x00\x00"); } if (self::$_isPhp6 === null) { self::$_isPhp6 = !version_compare(PHP_VERSION, '6.0.0', '<'); } $this->_marker = new stdClass(); } /** * Set an option * * @link Zend_Serializer_Adapter_AdapterAbstract::setOption() * @param string $name * @param mixed $value * @return Zend_Serializer_Adapter_PythonPickle */ public function setOption($name, $value) { switch ($name) { case 'protocol': $value = $this->_checkProtocolNumber($value); break; } return parent::setOption($name, $value); } /** * Check and normalize pickle protocol number * * @param int $number * @return int * @throws Zend_Serializer_Exception */ protected function _checkProtocolNumber($number) { $int = (int) $number; if ($int < 0 || $int > 3) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('Invalid or unknown protocol version "'.$number.'"'); } return $int; } /* serialize */ /** * Serialize PHP to PythonPickle format * * @param mixed $value * @param array $opts * @return string */ public function serialize($value, array $opts = array()) { $opts = $opts + $this->_options; $this->_protocol = $this->_checkProtocolNumber($opts['protocol']); $this->_binary = $this->_protocol != 0; // clear process vars before serializing $this->_memo = array(); $this->_pickle = ''; // write if ($this->_protocol >= 2) { $this->_writeProto($this->_protocol); } $this->_write($value); $this->_writeStop(); // clear process vars after serializing $this->_memo = array(); $pickle = $this->_pickle; $this->_pickle = ''; return $pickle; } /** * Write a value * * @param mixed $value * @return void * @throws Zend_Serializer_Exception on invalid or unrecognized value type */ protected function _write($value) { if ($value === null) { $this->_writeNull(); } elseif ($value === true) { $this->_writeTrue(); } elseif ($value === false) { $this->_writeFalse(); } elseif (is_int($value)) { $this->_writeInt($value); } elseif (is_float($value)) { $this->_writeFloat($value); } elseif (is_string($value)) { // TODO: write unicode / binary $this->_writeString($value); } elseif (is_array($value)) { if ($this->_isArrayAssoc($value)) { $this->_writeArrayDict($value); } else { $this->_writeArrayList($value); } } elseif (is_object($value)) { $this->_writeObject($value); } else { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception( 'PHP-Type "'.gettype($value).'" isn\'t serializable with '.get_class($this) ); } } /** * Write pickle protocol * * @param int $protocol * @return void */ protected function _writeProto($protocol) { $this->_pickle .= self::OP_PROTO . $protocol; } /** * Write a get * * @param int $id Id of memo * @return void */ protected function _writeGet($id) { if ($this->_binary) { if ($id <= 0xff) { // BINGET + chr(i) $this->_pickle .= self::OP_BINGET . chr($id); } else { // LONG_BINGET + pack("<i", i) $bin = pack('l', $id); if (self::$_isLittleEndian === false) { $bin = strrev($bin); } $this->_pickle .= self::OP_LONG_BINGET . $bin; } } else { $this->_pickle .= self::OP_GET . $id . "\r\n"; } } /** * Write a put * * @param int $id Id of memo * @return void */ protected function _writePut($id) { if ($this->_binary) { if ($id <= 0xff) { // BINPUT + chr(i) $this->_pickle .= self::OP_BINPUT . chr($id); } else { // LONG_BINPUT + pack("<i", i) $bin = pack('l', $id); if (self::$_isLittleEndian === false) { $bin = strrev($bin); } $this->_pickle .= self::OP_LONG_BINPUT . $bin; } } else { $this->_pickle .= self::OP_PUT . $id . "\r\n"; } } /** * Write a null as None * * @return void */ protected function _writeNull() { $this->_pickle .= self::OP_NONE; } /** * Write a boolean true * * @return void */ protected function _writeTrue() { if ($this->_protocol >= 2) { $this->_pickle .= self::OP_NEWTRUE; } else { $this->_pickle .= self::OP_INT . "01\r\n"; } } /** * Write a boolean false * * @return void */ protected function _writeFalse() { if ($this->_protocol >= 2) { $this->_pickle .= self::OP_NEWFALSE; } else { $this->_pickle .= self::OP_INT . "00\r\n"; } } /** * Write an integer value * * @param int $value * @return void */ protected function _writeInt($value) { if ($this->_binary) { if ($value >= 0) { if ($value <= 0xff) { // self.write(BININT1 + chr(obj)) $this->_pickle .= self::OP_BININT1 . chr($value); } elseif ($value <= 0xffff) { // self.write("%c%c%c" % (BININT2, obj&0xff, obj>>8)) $this->_pickle .= self::OP_BININT2 . pack('v', $value); } return; } // Next check for 4-byte signed ints: $highBits = $value >> 31; // note that Python shift sign-extends if ($highBits == 0 || $highBits == -1) { // All high bits are copies of bit 2**31, so the value // fits in a 4-byte signed int. // self.write(BININT + pack("<i", obj)) $bin = pack('l', $value); if (self::$_isLittleEndian === false) { $bin = strrev($bin); } $this->_pickle .= self::OP_BININT . $bin; return; } } $this->_pickle .= self::OP_INT . $value . "\r\n"; } /** * Write a float value * * @param float $value * @return void */ protected function _writeFloat($value) { if ($this->_binary) { // self.write(BINFLOAT + pack('>d', obj)) $bin = pack('d', $value); if (self::$_isLittleEndian === true) { $bin = strrev($bin); } $this->_pickle .= self::OP_BINFLOAT . $bin; } else { $this->_pickle .= self::OP_FLOAT . $value . "\r\n"; } } /** * Write a string value * * @param string $value * @return void */ protected function _writeString($value) { if ( ($id=$this->_searchMomo($value)) !== false ) { $this->_writeGet($id); return; } if ($this->_binary) { $n = strlen($value); if ($n <= 0xff) { // self.write(SHORT_BINSTRING + chr(n) + obj) $this->_pickle .= self::OP_SHORT_BINSTRING . chr($n) . $value; } else { // self.write(BINSTRING + pack("<i", n) + obj) $binLen = pack('l', $n); if (self::$_isLittleEndian === false) { $binLen = strrev($binLen); } $this->_pickle .= self::OP_BINSTRING . $binLen . $value; } } else { $this->_pickle .= self::OP_STRING . $this->_quoteString($value) . "\r\n"; } $this->_momorize($value); } /** * Write an associative array value as dictionary * * @param array $value * @return void */ protected function _writeArrayDict(array $value) { if (($id=$this->_searchMomo($value)) !== false) { $this->_writeGet($id);; return; } $this->_pickle .= self::OP_MARK . self::OP_DICT; $this->_momorize($value); foreach ($value as $k => $v) { $this->_pickle .= $this->_write($k) . $this->_write($v) . self::OP_SETITEM; } } /** * Write a simple array value as list * * @param array $value * @return void */ protected function _writeArrayList(array $value) { if (($id = $this->_searchMomo($value)) !== false) { $this->_writeGet($id); return; } $this->_pickle .= self::OP_MARK . self::OP_LIST; $this->_momorize($value); foreach ($value as $k => $v) { $this->_pickle .= $this->_write($v) . self::OP_APPEND; } } /** * Write an object as an dictionary * * @param object $value * @return void */ protected function _writeObject($value) { // can't serialize php objects to python objects yet $this->_writeArrayDict(get_object_vars($value)); } /** * Write stop * * @return void */ protected function _writeStop() { $this->_pickle .= self::OP_STOP; } /* serialize helper */ /** * Add a value to the memo and write the id * * @param mixed $value * @return void */ protected function _momorize($value) { $id = count($this->_memo); $this->_memo[$id] = $value; $this->_writePut($id); } /** * Search a value in the meno and return the id * * @param mixed $value * @return int|false The id or false */ protected function _searchMomo($value) { return array_search($value, $this->_memo, true); } /** * Is an array associative? * * @param array $value * @return boolean */ protected function _isArrayAssoc(array $value) { return array_diff_key($value, array_keys(array_keys($value))); } /** * Quote/Escape a string * * @param string $str * @return string quoted string */ protected function _quoteString($str) { $quoteArr = self::$_quoteString; if (($cntSingleQuote = substr_count($str, "'")) && ($cntDoubleQuote = substr_count($str, '"')) && ($cntSingleQuote < $cntDoubleQuote) ) { $quoteArr['"'] = '\\"'; $enclosure = '"'; } else { $quoteArr["'"] = "\\'"; $enclosure = "'"; } return $enclosure . strtr($str, $quoteArr) . $enclosure; } /* unserialize */ /** * Unserialize from Python Pickle format to PHP * * @param string $pickle * @param array $opts * @return mixed * @throws Zend_Serializer_Exception on invalid Pickle string */ public function unserialize($pickle, array $opts = array()) { // init process vars $this->_pos = 0; $this->_pickle = $pickle; $this->_pickleLen = strlen($this->_pickle); $this->_memo = array(); $this->_stack = array(); // read pickle string while (($op=$this->_read(1)) !== self::OP_STOP) { $this->_load($op); } if (!count($this->_stack)) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('No data found'); } $ret = array_pop($this->_stack); // clear process vars $this->_pos = 0; $this->_pickle = ''; $this->_pickleLen = 0; $this->_memo = array(); $this->_stack = array(); return $ret; } /** * Load a pickle opcode * * @param string $op * @return void * @throws Zend_Serializer_Exception on invalid opcode */ protected function _load($op) { switch ($op) { case self::OP_PUT: $this->_loadPut(); break; case self::OP_BINPUT: $this->_loadBinPut(); break; case self::OP_LONG_BINPUT: $this->_loadLongBinPut(); break; case self::OP_GET: $this->_loadGet(); break; case self::OP_BINGET: $this->_loadBinGet(); break; case self::OP_LONG_BINGET: $this->_loadLongBinGet(); break; case self::OP_NONE: $this->_loadNone(); break; case self::OP_NEWTRUE: $this->_loadNewTrue(); break; case self::OP_NEWFALSE: $this->_loadNewFalse(); break; case self::OP_INT: $this->_loadInt(); break; case self::OP_BININT: $this->_loadBinInt(); break; case self::OP_BININT1: $this->_loadBinInt1(); break; case self::OP_BININT2: $this->_loadBinInt2(); break; case self::OP_LONG: $this->_loadLong(); break; case self::OP_LONG1: $this->_loadLong1(); break; case self::OP_LONG4: $this->_loadLong4(); break; case self::OP_FLOAT: $this->_loadFloat(); break; case self::OP_BINFLOAT: $this->_loadBinFloat(); break; case self::OP_STRING: $this->_loadString(); break; case self::OP_BINSTRING: $this->_loadBinString(); break; case self::OP_SHORT_BINSTRING: $this->_loadShortBinString(); break; case self::OP_BINBYTES: $this->_loadBinBytes(); break; case self::OP_SHORT_BINBYTES: $this->_loadShortBinBytes(); break; case self::OP_UNICODE: $this->_loadUnicode(); break; case self::OP_BINUNICODE: $this->_loadBinUnicode(); break; case self::OP_MARK: $this->_loadMark(); break; case self::OP_LIST: $this->_loadList(); break; case self::OP_EMPTY_LIST: $this->_loadEmptyList(); break; case self::OP_APPEND: $this->_loadAppend(); break; case self::OP_APPENDS: $this->_loadAppends(); break; case self::OP_DICT: $this->_loadDict(); break; case self::OP_EMPTY_DICT: $this->_loadEmptyDict(); break; case self::OP_SETITEM: $this->_loadSetItem(); break; case self::OP_SETITEMS: $this->_loadSetItems(); break; case self::OP_TUPLE: $this->_loadTuple(); break; case self::OP_TUPLE1: $this->_loadTuple1(); break; case self::OP_TUPLE2: $this->_loadTuple2(); break; case self::OP_TUPLE3: $this->_loadTuple3(); break; case self::OP_PROTO: $this->_loadProto(); break; default: require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('Invalid or unknown opcode "'.$op.'"'); } } /** * Load a PUT opcode * * @return void * @throws Zend_Serializer_Exception on missing stack */ protected function _loadPut() { $id = (int)$this->_readline(); $lastStack = count($this->_stack)-1; if (!isset($this->_stack[$lastStack])) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('No stack exist'); } $this->_memo[$id] = & $this->_stack[$lastStack]; } /** * Load a binary PUT * * @return void * @throws Zend_Serializer_Exception on missing stack */ protected function _loadBinPut() { $id = ord($this->_read(1)); $lastStack = count($this->_stack)-1; if (!isset($this->_stack[$lastStack])) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('No stack exist'); } $this->_memo[$id] = & $this->_stack[$lastStack]; } /** * Load a long binary PUT * * @return void * @throws Zend_Serializer_Exception on missing stack */ protected function _loadLongBinPut() { $bin = $this->_read(4); if (self::$_isLittleEndian === false) { $bin = strrev($bin); } list(, $id) = unpack('l', $bin); $lastStack = count($this->_stack)-1; if (!isset($this->_stack[$lastStack])) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('No stack exist'); } $this->_memo[$id] = & $this->_stack[$lastStack]; } /** * Load a GET operation * * @return void * @throws Zend_Serializer_Exception on missing GET identifier */ protected function _loadGet() { $id = (int)$this->_readline(); if (!array_key_exists($id, $this->_memo)) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('Get id "' . $id . '" not found in momo'); } $this->_stack[] = & $this->_memo[$id]; } /** * Load a binary GET operation * * @return void * @throws Zend_Serializer_Exception on missing GET identifier */ protected function _loadBinGet() { $id = ord($this->_read(1)); if (!array_key_exists($id, $this->_memo)) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('Get id "' . $id . '" not found in momo'); } $this->_stack[] = & $this->_memo[$id]; } /** * Load a long binary GET operation * * @return void * @throws Zend_Serializer_Exception on missing GET identifier */ protected function _loadLongBinGet() { $bin = $this->_read(4); if (self::$_isLittleEndian === false) { $bin = strrev($bin); } list(, $id) = unpack('l', $bin); if (!array_key_exists($id, $this->_memo)) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('Get id "' . $id . '" not found in momo'); } $this->_stack[] = & $this->_memo[$id]; } /** * Load a NONE operator * * @return void */ protected function _loadNone() { $this->_stack[] = null; } /** * Load a boolean TRUE operator * * @return void */ protected function _loadNewTrue() { $this->_stack[] = true; } /** * Load a boolean FALSE operator * * @return void */ protected function _loadNewFalse() { $this->_stack[] = false; } /** * Load an integer operator * * @return void */ protected function _loadInt() { $line = $this->_readline(); if ($line === '01') { $this->_stack[] = true; } elseif ($line === '00') { $this->_stack[] = false; } else { $this->_stack[] = (int)$line; } } /** * Load a binary integer operator * * @return void */ protected function _loadBinInt() { $bin = $this->_read(4); if (self::$_isLittleEndian === false) { $bin = strrev($bin); } list(, $int) = unpack('l', $bin); $this->_stack[] = $int; } /** * Load the first byte of a binary integer * * @return void */ protected function _loadBinInt1() { $this->_stack[] = ord($this->_read(1)); } /** * Load the second byte of a binary integer * * @return void */ protected function _loadBinInt2() { $bin = $this->_read(2); list(, $int) = unpack('v', $bin); $this->_stack[] = $int; } /** * Load a long (float) operator * * @return void */ protected function _loadLong() { $data = rtrim($this->_readline(), 'L'); if ($data === '') { $this->_stack[] = 0; } else { $this->_stack[] = $data; } } /** * Load a one byte long integer * * @return void */ protected function _loadLong1() { $n = ord($this->_read(1)); $data = $this->_read($n); $this->_stack[] = $this->_decodeBinLong($data); } /** * Load a 4 byte long integer * * @return void */ protected function _loadLong4() { $nBin = $this->_read(4); if (self::$_isLittleEndian === false) { $nBin = strrev($$nBin); } list(, $n) = unpack('l', $nBin); $data = $this->_read($n); $this->_stack[] = $this->_decodeBinLong($data); } /** * Load a float value * * @return void */ protected function _loadFloat() { $float = (float)$this->_readline(); $this->_stack[] = $float; } /** * Load a binary float value * * @return void */ protected function _loadBinFloat() { $bin = $this->_read(8); if (self::$_isLittleEndian === true) { $bin = strrev($bin); } list(, $float) = unpack('d', $bin); $this->_stack[] = $float; } /** * Load a string * * @return void */ protected function _loadString() { $this->_stack[] = $this->_unquoteString((string)$this->_readline()); } /** * Load a binary string * * @return void */ protected function _loadBinString() { $bin = $this->_read(4); if (!self::$_isLittleEndian) { $bin = strrev($bin); } list(, $len) = unpack('l', $bin); $this->_stack[] = (string)$this->_read($len); } /** * Load a short binary string * * @return void */ protected function _loadShortBinString() { $len = ord($this->_read(1)); $this->_stack[] = (string)$this->_read($len); } /** * Load arbitrary binary bytes * * @return void */ protected function _loadBinBytes() { // read byte length $nBin = $this->_read(4); if (self::$_isLittleEndian === false) { $nBin = strrev($$nBin); } list(, $n) = unpack('l', $nBin); $this->_stack[] = $this->_read($n); } /** * Load a single binary byte * * @return void */ protected function _loadShortBinBytes() { $n = ord($this->_read(1)); $this->_stack[] = $this->_read($n); } /** * Load a unicode string * * @return void */ protected function _loadUnicode() { $data = $this->_readline(); $pattern = '/\\\\u([a-fA-F0-9]{4})/u'; // \uXXXX $data = preg_replace_callback($pattern, array($this, '_convertMatchingUnicodeSequence2Utf8'), $data); if (self::$_isPhp6) { $data = unicode_decode($data, 'UTF-8'); } $this->_stack[] = $data; } /** * Convert a unicode sequence to UTF-8 * * @param array $match * @return string */ protected function _convertMatchingUnicodeSequence2Utf8(array $match) { return $this->_hex2Utf8($match[1]); } /** * Convert a hex string to a UTF-8 string * * @param string $sequence * @return string * @throws Zend_Serializer_Exception on unmatched unicode sequence */ protected function _hex2Utf8($hex) { $uniCode = hexdec($hex); if ($uniCode < 0x80) { // 1Byte $utf8Char = chr($uniCode); } elseif ($uniCode < 0x800) { // 2Byte $utf8Char = chr(0xC0 | $uniCode >> 6) . chr(0x80 | $uniCode & 0x3F); } elseif ($uniCode < 0x10000) { // 3Byte $utf8Char = chr(0xE0 | $uniCode >> 12) . chr(0x80 | $uniCode >> 6 & 0x3F) . chr(0x80 | $uniCode & 0x3F); } elseif ($uniCode < 0x110000) { // 4Byte $utf8Char = chr(0xF0 | $uniCode >> 18) . chr(0x80 | $uniCode >> 12 & 0x3F) . chr(0x80 | $uniCode >> 6 & 0x3F) . chr(0x80 | $uniCode & 0x3F); } else { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('Unsupported unicode character found "' . dechex($uniCode) . '"'); } return $utf8Char; } /** * Load binary unicode sequence * * @return void */ protected function _loadBinUnicode() { // read byte length $n = $this->_read(4); if (self::$_isLittleEndian === false) { $n = strrev($n); } list(, $n) = unpack('l', $n); $data = $this->_read($n); if (self::$_isPhp6) { $data = unicode_decode($data, 'UTF-8'); } $this->_stack[] = $data; } /** * Load a marker sequence * * @return void */ protected function _loadMark() { $this->_stack[] = $this->_marker; } /** * Load an array (list) * * @return void */ protected function _loadList() { $k = $this->_lastMarker(); $this->_stack[$k] = array(); // remove all elements after marker $max = count($this->_stack); for ($i = $k+1, $max; $i < $max; $i++) { unset($this->_stack[$i]); } } /** * Load an append (to list) sequence * * @return void */ protected function _loadAppend() { $value = array_pop($this->_stack); $list =& $this->_stack[count($this->_stack)-1]; $list[] = $value; } /** * Load an empty list sequence * * @return void */ protected function _loadEmptyList() { $this->_stack[] = array(); } /** * Load multiple append (to list) sequences at once * * @return void */ protected function _loadAppends() { $k = $this->_lastMarker(); $list =& $this->_stack[$k - 1]; $max = count($this->_stack); for ($i = $k + 1; $i < $max; $i++) { $list[] = $this->_stack[$i]; unset($this->_stack[$i]); } unset($this->_stack[$k]); } /** * Load an associative array (Python dictionary) * * @return void */ protected function _loadDict() { $k = $this->_lastMarker(); $this->_stack[$k] = array(); // remove all elements after marker $max = count($this->_stack); for($i = $k + 1; $i < $max; $i++) { unset($this->_stack[$i]); } } /** * Load an item from a set * * @return void */ protected function _loadSetItem() { $value = array_pop($this->_stack); $key = array_pop($this->_stack); $dict =& $this->_stack[count($this->_stack) - 1]; $dict[$key] = $value; } /** * Load an empty dictionary * * @return void */ protected function _loadEmptyDict() { $this->_stack[] = array(); } /** * Load set items * * @return void */ protected function _loadSetItems() { $k = $this->_lastMarker(); $dict =& $this->_stack[$k - 1]; $max = count($this->_stack); for ($i = $k + 1; $i < $max; $i += 2) { $key = $this->_stack[$i]; $value = $this->_stack[$i + 1]; $dict[$key] = $value; unset($this->_stack[$i], $this->_stack[$i+1]); } unset($this->_stack[$k]); } /** * Load a tuple * * @return void */ protected function _loadTuple() { $k = $this->_lastMarker(); $this->_stack[$k] = array(); $tuple =& $this->_stack[$k]; $max = count($this->_stack); for($i = $k + 1; $i < $max; $i++) { $tuple[] = $this->_stack[$i]; unset($this->_stack[$i]); } } /** * Load single item tuple * * @return void */ protected function _loadTuple1() { $value1 = array_pop($this->_stack); $this->_stack[] = array($value1); } /** * Load two item tuple * * @return void */ protected function _loadTuple2() { $value2 = array_pop($this->_stack); $value1 = array_pop($this->_stack); $this->_stack[] = array($value1, $value2); } /** * Load three item tuple * * @return void */ protected function _loadTuple3() { $value3 = array_pop($this->_stack); $value2 = array_pop($this->_stack); $value1 = array_pop($this->_stack); $this->_stack[] = array($value1, $value2, $value3); } /** * Load a proto value * * @return void * @throws Zend_Serializer_Exception if Pickle version does not support this feature */ protected function _loadProto() { $proto = ord($this->_read(1)); if ($proto < 2 || $proto > 3) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('Invalid protocol version detected'); } $this->_protocol = $proto; } /* unserialize helper */ /** * Read a segment of the pickle * * @param mixed $len * @return string * @throws Zend_Serializer_Exception if position matches end of data */ protected function _read($len) { if (($this->_pos + $len) > $this->_pickleLen) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('End of data'); } $this->_pos+= $len; return substr($this->_pickle, ($this->_pos - $len), $len); } /** * Read a line of the pickle at once * * @return string * @throws Zend_Serializer_Exception if no EOL character found */ protected function _readline() { $eolLen = 2; $eolPos = strpos($this->_pickle, "\r\n", $this->_pos); if ($eolPos === false) { $eolPos = strpos($this->_pickle, "\n", $this->_pos); $eolLen = 1; } if ($eolPos === false) { require_once 'Zend/Serializer/Exception.php'; throw new Zend_Serializer_Exception('No new line found'); } $ret = substr($this->_pickle, $this->_pos, $eolPos-$this->_pos); $this->_pos = $eolPos + $eolLen; return $ret; } /** * Unquote/Unescape a quoted string * * @param string $str quoted string * @return string unquoted string */ protected function _unquoteString($str) { $quoteArr = array_flip(self::$_quoteString); if ($str[0] == '"') { $quoteArr['\\"'] = '"'; } else { $quoteArr["\\'"] = "'"; } return strtr(substr(trim($str), 1, -1), $quoteArr); } /** * Return last marker position in stack * * @return int */ protected function _lastMarker() { for ($k = count($this->_stack)-1; $k >= 0; $k -= 1) { if ($this->_stack[$k] === $this->_marker) { break; } } return $k; } /** * Decode a binary long sequence * * @param string $data * @return int|float|string */ protected function _decodeBinLong($data) { $nbytes = strlen($data); if ($nbytes == 0) { return 0; } $long = 0; if ($nbytes > 7) { if (!extension_loaded('bcmath')) { return INF; } for ($i=0; $i<$nbytes; $i++) { $long = bcadd($long, bcmul(ord($data[$i]), bcpow(256, $i, 0))); } if (0x80 <= ord($data[$nbytes-1])) { $long = bcsub($long, bcpow(2, $nbytes * 8)); } } else { for ($i=0; $i<$nbytes; $i++) { $long+= ord($data[$i]) * pow(256, $i); } if (0x80 <= ord($data[$nbytes-1])) { $long-= pow(2, $nbytes * 8); // $long-= 1 << ($nbytes * 8); } } return $long; } }