1464 lines
40 KiB
PHP
1464 lines
40 KiB
PHP
<?php
|
|
/**
|
|
* Zend Framework
|
|
*
|
|
* LICENSE
|
|
*
|
|
* This source file is subject to the new BSD license that is bundled
|
|
* with this package in the file LICENSE.txt.
|
|
* It is also available through the world-wide-web at this URL:
|
|
* http://framework.zend.com/license/new-bsd
|
|
* If you did not receive a copy of the license and are unable to
|
|
* obtain it through the world-wide-web, please send an email
|
|
* to license@zend.com so we can send you a copy immediately.
|
|
*
|
|
* @category Zend
|
|
* @package Zend_Serializer
|
|
* @subpackage Adapter
|
|
* @copyright Copyright (c) 2005-2015 Zend Technologies USA Inc. (http://www.zend.com)
|
|
* @license http://framework.zend.com/license/new-bsd New BSD License
|
|
* @version $Id$
|
|
*/
|
|
|
|
/** @see Zend_Serializer_Adapter_AdapterAbstract */
|
|
|
|
/**
|
|
* @link http://www.python.org
|
|
* @see Python3.1/Lib/pickle.py
|
|
* @see Python3.1/Modules/_pickle.c
|
|
* @link http://pickle-js.googlecode.com
|
|
* @category Zend
|
|
* @package Zend_Serializer
|
|
* @subpackage Adapter
|
|
* @copyright Copyright (c) 2005-2015 Zend Technologies USA Inc. (http://www.zend.com)
|
|
* @license http://framework.zend.com/license/new-bsd New BSD License
|
|
*/
|
|
class Zend_Serializer_Adapter_PythonPickle extends Zend_Serializer_Adapter_AdapterAbstract
|
|
{
|
|
/*
 * Pickle opcodes, in roughly alphabetical order of their one-character
 * code (pickletools.py groups them by purpose and documents them in full).
 */

/* Stack control */
const OP_MARK     = '(';    // push the special mark object on the stack
const OP_STOP     = '.';    // every pickle ends with STOP
const OP_POP      = '0';    // discard the topmost stack item
const OP_POP_MARK = '1';    // discard the stack top through the topmost mark object
const OP_DUP      = '2';    // duplicate the top stack item

/* Scalars and strings */
const OP_FLOAT           = 'F';    // push float object; decimal string argument
const OP_INT             = 'I';    // push integer or bool; decimal string argument
const OP_BININT          = 'J';    // push four-byte signed int
const OP_BININT1         = 'K';    // push 1-byte unsigned int
const OP_LONG            = 'L';    // push long; decimal string argument
const OP_BININT2         = 'M';    // push 2-byte unsigned int
const OP_NONE            = 'N';    // push None
const OP_PERSID          = 'P';    // push persistent object; id is taken from string argument
const OP_BINPERSID       = 'Q';    // push persistent object; id is taken from the stack
const OP_REDUCE          = 'R';    // apply callable to argtuple, both on stack
const OP_STRING          = 'S';    // push string; NL-terminated string argument
const OP_BINSTRING       = 'T';    // push string; counted binary string argument
const OP_SHORT_BINSTRING = 'U';    // push string; counted binary string argument < 256 bytes
const OP_UNICODE         = 'V';    // push Unicode string; raw-unicode-escaped argument
const OP_BINUNICODE      = 'X';    // push Unicode string; counted UTF-8 string argument

/* Containers, objects and memo */
const OP_APPEND      = 'a';    // append stack top to the list below it
const OP_BUILD       = 'b';    // call __setstate__ or __dict__.update()
const OP_GLOBAL      = 'c';    // push self.find_class(modname, name); 2 string arguments
const OP_DICT        = 'd';    // build a dict from stack items
const OP_EMPTY_DICT  = '}';    // push empty dict
const OP_APPENDS     = 'e';    // extend list on stack by topmost stack slice
const OP_GET         = 'g';    // push item from memo on stack; index is string argument
const OP_BINGET      = 'h';    // push item from memo on stack; index is 1-byte argument
const OP_INST        = 'i';    // build & push class instance
const OP_LONG_BINGET = 'j';    // push item from memo on stack; index is 4-byte argument
const OP_LIST        = 'l';    // build list from topmost stack items
const OP_EMPTY_LIST  = ']';    // push empty list
const OP_OBJ         = 'o';    // build & push class instance
const OP_PUT         = 'p';    // store stack top in memo; index is string argument
const OP_BINPUT      = 'q';    // store stack top in memo; index is 1-byte argument
const OP_LONG_BINPUT = 'r';    // store stack top in memo; index is 4-byte argument
const OP_SETITEM     = 's';    // add key+value pair to dict
const OP_TUPLE       = 't';    // build tuple from topmost stack items
const OP_EMPTY_TUPLE = ')';    // push empty tuple
const OP_SETITEMS    = 'u';    // modify dict by adding topmost key+value pairs
const OP_BINFLOAT    = 'G';    // push float; argument is 8-byte float encoding

/* Protocol 2 */
const OP_PROTO    = "\x80";    // identify pickle protocol
const OP_NEWOBJ   = "\x81";    // build object by applying cls.__new__ to argtuple
const OP_EXT1     = "\x82";    // push object from extension registry; 1-byte index
const OP_EXT2     = "\x83";    // push object from extension registry; 2-byte index
const OP_EXT4     = "\x84";    // push object from extension registry; 4-byte index
const OP_TUPLE1   = "\x85";    // build 1-tuple from stack top
const OP_TUPLE2   = "\x86";    // build 2-tuple from two topmost stack items
const OP_TUPLE3   = "\x87";    // build 3-tuple from three topmost stack items
const OP_NEWTRUE  = "\x88";    // push True
const OP_NEWFALSE = "\x89";    // push False
const OP_LONG1    = "\x8a";    // push long from < 256 bytes
const OP_LONG4    = "\x8b";    // push really big long

/* Protocol 3 (Python 3.x) */
const OP_BINBYTES       = 'B';    // push bytes; counted binary string argument
const OP_SHORT_BINBYTES = 'C';    // push bytes; counted binary string argument < 256 bytes
|
|
|
|
/**
 * @var bool|null True when pack('l', ...) yields little-endian bytes on this
 *                machine; null until the constructor has probed it
 */
protected static $_isLittleEndian = null;

/**
 * @var array Byte => escape-sequence table used when quoting protocol 0
 *            strings (and, flipped, when unquoting them)
 */
protected static $_quoteString = array(
    '\\'   => '\\\\',
    "\x00" => '\\x00', "\x01" => '\\x01', "\x02" => '\\x02', "\x03" => '\\x03',
    "\x04" => '\\x04', "\x05" => '\\x05', "\x06" => '\\x06', "\x07" => '\\x07',
    "\x08" => '\\x08', "\x09" => '\\t',   "\x0a" => '\\n',   "\x0b" => '\\x0b',
    "\x0c" => '\\x0c', "\x0d" => '\\r',   "\x0e" => '\\x0e', "\x0f" => '\\x0f',
    "\x10" => '\\x10', "\x11" => '\\x11', "\x12" => '\\x12', "\x13" => '\\x13',
    "\x14" => '\\x14', "\x15" => '\\x15', "\x16" => '\\x16', "\x17" => '\\x17',
    "\x18" => '\\x18', "\x19" => '\\x19', "\x1a" => '\\x1a', "\x1b" => '\\x1b',
    "\x1c" => '\\x1c', "\x1d" => '\\x1d', "\x1e" => '\\x1e', "\x1f" => '\\x1f',
    "\xff" => '\\xff'
);

/**
 * @var array Default options ("protocol" is the pickle protocol, 0 to 3)
 */
protected $_options = array(
    'protocol' => 0,
);

// Working state, reset at the start and end of serialize()/unserialize()

/** @var int Pickle protocol currently being written or read */
protected $_protocol  = 0;

/** @var bool True when a binary protocol (anything but 0) is being written */
protected $_binary    = false;

/** @var array Memo table, indexed by memo id */
protected $_memo      = array();

/** @var string Pickle being built (serialize) or consumed (unserialize) */
protected $_pickle    = '';

/** @var int Byte length of the pickle being consumed */
protected $_pickleLen = 0;

/** @var int Read offset into the pickle being consumed */
protected $_pos       = 0;

/** @var array Value stack used while unserializing */
protected $_stack     = array();

/** @var stdClass|null Sentinel pushed on the stack for the MARK opcode */
protected $_marker    = null;
|
|
|
|
/**
 * Constructor
 *
 * Forwards the options to the parent adapter, probes the machine byte
 * order once per process and creates the sentinel object used for MARK.
 *
 * @link  Zend_Serializer_Adapter_AdapterAbstract::__construct()
 * @param mixed $opts Options, passed unchanged to the parent constructor
 */
public function __construct($opts=array())
{
    parent::__construct($opts);

    // The byte-order probe is shared by all instances, so run it only once.
    if (null === self::$_isLittleEndian) {
        $probe = pack('l', 1);
        self::$_isLittleEndian = ("\x01\x00\x00\x00" === $probe);
    }

    $this->_marker = new stdClass();
}
|
|
|
|
/**
 * Set an option
 *
 * The "protocol" option is validated and normalized to an integer before
 * being handed to the parent; every other option is passed through as is.
 *
 * @link   Zend_Serializer_Adapter_AdapterAbstract::setOption()
 * @param  string $name
 * @param  mixed  $value
 * @return Zend_Serializer_Adapter_PythonPickle
 * @throws Zend_Serializer_Exception on an invalid protocol number
 */
public function setOption($name, $value)
{
    // Loose comparison on purpose: mirrors the switch/case it replaces.
    if ($name == 'protocol') {
        $value = $this->_checkProtocolNumber($value);
    }

    return parent::setOption($name, $value);
}
|
|
|
|
/**
 * Check and normalize pickle protocol number
 *
 * The value is cast to int and must lie in the range 0..3.
 *
 * @param  int $number
 * @return int The protocol number as an integer
 * @throws Zend_Serializer_Exception when the number is outside 0..3
 */
protected function _checkProtocolNumber($number)
{
    $protocol = (int) $number;

    if ($protocol >= 0 && $protocol <= 3) {
        return $protocol;
    }

    throw new Zend_Serializer_Exception('Invalid or unknown protocol version "'.$number.'"');
}
|
|
|
|
/* serialize */
|
|
|
|
/**
 * Serialize PHP to PythonPickle format
 *
 * Per-call options override the adapter options. A PROTO header is
 * written for protocol 2 and above, followed by the value and STOP.
 *
 * @param  mixed $value
 * @param  array $opts  Supports "protocol" (0..3)
 * @return string The pickle
 * @throws Zend_Serializer_Exception on an invalid protocol or unserializable value
 */
public function serialize($value, array $opts = array())
{
    $opts += $this->_options;

    $this->_protocol = $this->_checkProtocolNumber($opts['protocol']);
    $this->_binary   = ($this->_protocol != 0);

    // start from a clean slate
    $this->_memo   = array();
    $this->_pickle = '';

    if ($this->_protocol >= 2) {
        $this->_writeProto($this->_protocol);
    }
    $this->_write($value);
    $this->_writeStop();

    // hand the result out and drop the working state again
    $result        = $this->_pickle;
    $this->_memo   = array();
    $this->_pickle = '';

    return $result;
}
|
|
|
|
/**
 * Write a value
 *
 * Dispatches on the PHP type of the value to the matching writer.
 * Arrays are written as a dict when _isArrayAssoc() says so, else as a list.
 *
 * @param  mixed $value
 * @return void
 * @throws Zend_Serializer_Exception on invalid or unrecognized value type
 */
protected function _write($value)
{
    if (null === $value) {
        $this->_writeNull();
        return;
    }

    if (true === $value) {
        $this->_writeTrue();
        return;
    }

    if (false === $value) {
        $this->_writeFalse();
        return;
    }

    if (is_int($value)) {
        $this->_writeInt($value);
        return;
    }

    if (is_float($value)) {
        $this->_writeFloat($value);
        return;
    }

    if (is_string($value)) {
        // TODO: write unicode / binary
        $this->_writeString($value);
        return;
    }

    if (is_array($value)) {
        if ($this->_isArrayAssoc($value)) {
            $this->_writeArrayDict($value);
        } else {
            $this->_writeArrayList($value);
        }
        return;
    }

    if (is_object($value)) {
        $this->_writeObject($value);
        return;
    }

    throw new Zend_Serializer_Exception(
        'PHP-Type "'.gettype($value).'" isn\'t serializable with '.get_class($this)
    );
}
|
|
|
|
/**
 * Write pickle protocol
 *
 * The PROTO opcode takes the protocol version as a single raw byte. It
 * used to be appended as a decimal digit ("2" = 0x32), which _loadProto()
 * (it reads the byte with ord()) rejects as an invalid version.
 *
 * @param  int $protocol
 * @return void
 */
protected function _writeProto($protocol)
{
    $this->_pickle .= self::OP_PROTO . chr((int) $protocol);
}
|
|
|
|
/**
 * Write a get
 *
 * Text protocol: GET plus the decimal id and a line break. Binary
 * protocols: BINGET with a 1-byte id, or LONG_BINGET with a 4-byte
 * little-endian id when the id does not fit into one byte.
 *
 * @param  int $id Id of memo
 * @return void
 */
protected function _writeGet($id)
{
    if (!$this->_binary) {
        $this->_pickle .= self::OP_GET . $id . "\r\n";
        return;
    }

    if ($id <= 0xff) {
        // BINGET + chr(i)
        $this->_pickle .= self::OP_BINGET . chr($id);
        return;
    }

    // LONG_BINGET + pack("<i", i)
    $packedId = pack('l', $id);
    if (self::$_isLittleEndian === false) {
        $packedId = strrev($packedId);
    }
    $this->_pickle .= self::OP_LONG_BINGET . $packedId;
}
|
|
|
|
/**
 * Write a put
 *
 * Text protocol: PUT plus the decimal id and a line break. Binary
 * protocols: BINPUT with a 1-byte id, or LONG_BINPUT with a 4-byte
 * little-endian id when the id does not fit into one byte.
 *
 * @param  int $id Id of memo
 * @return void
 */
protected function _writePut($id)
{
    if (!$this->_binary) {
        $this->_pickle .= self::OP_PUT . $id . "\r\n";
        return;
    }

    if ($id <= 0xff) {
        // BINPUT + chr(i)
        $this->_pickle .= self::OP_BINPUT . chr($id);
        return;
    }

    // LONG_BINPUT + pack("<i", i)
    $packedId = pack('l', $id);
    if (self::$_isLittleEndian === false) {
        $packedId = strrev($packedId);
    }
    $this->_pickle .= self::OP_LONG_BINPUT . $packedId;
}
|
|
|
|
/**
 * Write a null as None
 *
 * Appends the NONE opcode to the pickle.
 *
 * @return void
 */
protected function _writeNull()
{
    $this->_pickle = $this->_pickle . self::OP_NONE;
}
|
|
|
|
/**
 * Write a boolean true
 *
 * Protocol 2 and above use the NEWTRUE opcode; older protocols use the
 * INT opcode with the argument "01".
 *
 * @return void
 */
protected function _writeTrue()
{
    $this->_pickle .= ($this->_protocol >= 2)
        ? self::OP_NEWTRUE
        : (self::OP_INT . "01\r\n");
}
|
|
|
|
/**
 * Write a boolean false
 *
 * Protocol 2 and above use the NEWFALSE opcode; older protocols use the
 * INT opcode with the argument "00".
 *
 * @return void
 */
protected function _writeFalse()
{
    $this->_pickle .= ($this->_protocol >= 2)
        ? self::OP_NEWFALSE
        : (self::OP_INT . "00\r\n");
}
|
|
|
|
/**
 * Write an integer value
 *
 * In binary mode the shortest fitting encoding is used: BININT1
 * (0..0xff), BININT2 (0..0xffff) or BININT (4-byte signed, little-endian).
 * Everything else, and every value in text mode, is written with the INT
 * opcode and a decimal argument.
 *
 * Each branch returns on its own. Previously a single "return" followed
 * the two unsigned branches, so non-negative values above 0xffff were
 * silently dropped from binary pickles.
 *
 * @param  int $value
 * @return void
 */
protected function _writeInt($value)
{
    if ($this->_binary) {
        if ($value >= 0) {
            if ($value <= 0xff) {
                // self.write(BININT1 + chr(obj))
                $this->_pickle .= self::OP_BININT1 . chr($value);
                return;
            }

            if ($value <= 0xffff) {
                // self.write("%c%c%c" % (BININT2, obj&0xff, obj>>8))
                $this->_pickle .= self::OP_BININT2 . pack('v', $value);
                return;
            }
        }

        // Next check for 4-byte signed ints. The shift sign-extends, so
        // the result is 0 or -1 exactly when the value fits into 32 bits.
        $highBits = $value >> 31;
        if ($highBits == 0 || $highBits == -1) {
            // self.write(BININT + pack("<i", obj))
            $bin = pack('l', $value);
            if (self::$_isLittleEndian === false) {
                $bin = strrev($bin);
            }
            $this->_pickle .= self::OP_BININT . $bin;
            return;
        }
    }

    $this->_pickle .= self::OP_INT . $value . "\r\n";
}
|
|
|
|
/**
 * Write a float value
 *
 * Text protocol: FLOAT plus PHP's string form of the value. Binary
 * protocols: BINFLOAT plus the 8 bytes of pack('d'), reversed on
 * little-endian machines so that they are written big-endian.
 *
 * @param  float $value
 * @return void
 */
protected function _writeFloat($value)
{
    if (!$this->_binary) {
        $this->_pickle .= self::OP_FLOAT . $value . "\r\n";
        return;
    }

    // self.write(BINFLOAT + pack('>d', obj))
    $packed = pack('d', $value);
    if (self::$_isLittleEndian === true) {
        $packed = strrev($packed);
    }
    $this->_pickle .= self::OP_BINFLOAT . $packed;
}
|
|
|
|
/**
 * Write a string value
 *
 * A string already present in the memo is written as a GET of its memo
 * id. Otherwise it is written (quoted in text mode, length-prefixed in
 * binary mode) and then added to the memo.
 *
 * @param  string $value
 * @return void
 */
protected function _writeString($value)
{
    $memoId = $this->_searchMomo($value);
    if ($memoId !== false) {
        $this->_writeGet($memoId);
        return;
    }

    if (!$this->_binary) {
        $this->_pickle .= self::OP_STRING . $this->_quoteString($value) . "\r\n";
    } else {
        $length = strlen($value);
        if ($length <= 0xff) {
            // self.write(SHORT_BINSTRING + chr(n) + obj)
            $this->_pickle .= self::OP_SHORT_BINSTRING . chr($length) . $value;
        } else {
            // self.write(BINSTRING + pack("<i", n) + obj)
            $packedLength = pack('l', $length);
            if (self::$_isLittleEndian === false) {
                $packedLength = strrev($packedLength);
            }
            $this->_pickle .= self::OP_BINSTRING . $packedLength . $value;
        }
    }

    $this->_momorize($value);
}
|
|
|
|
/**
 * Write an associative array value as dictionary
 *
 * Emits MARK + DICT (an empty dict), memoizes it, then writes every
 * key/value pair followed by SETITEM. An identical array already in the
 * memo is written as a GET instead.
 *
 * _write() returns nothing and appends to the pickle itself, so the
 * calls are made as plain statements. The previous code concatenated
 * their void results into the pickle and only produced the right bytes
 * because PHP evaluates the right-hand side first.
 *
 * @param  array $value
 * @return void
 */
protected function _writeArrayDict(array $value)
{
    if (($id = $this->_searchMomo($value)) !== false) {
        $this->_writeGet($id);
        return;
    }

    $this->_pickle .= self::OP_MARK . self::OP_DICT;
    $this->_momorize($value);

    foreach ($value as $k => $v) {
        $this->_write($k);
        $this->_write($v);
        $this->_pickle .= self::OP_SETITEM;
    }
}
|
|
|
|
/**
 * Write a simple array value as list
 *
 * Emits MARK + LIST (an empty list), memoizes it, then writes every
 * element followed by APPEND. An identical array already in the memo is
 * written as a GET instead.
 *
 * _write() returns nothing and appends to the pickle itself, so it is
 * called as a plain statement rather than concatenated into the pickle.
 *
 * @param  array $value
 * @return void
 */
protected function _writeArrayList(array $value)
{
    if (($id = $this->_searchMomo($value)) !== false) {
        $this->_writeGet($id);
        return;
    }

    $this->_pickle .= self::OP_MARK . self::OP_LIST;
    $this->_momorize($value);

    foreach ($value as $v) {
        $this->_write($v);
        $this->_pickle .= self::OP_APPEND;
    }
}
|
|
|
|
/**
 * Write an object as a dictionary
 *
 * PHP objects cannot be mapped to Python objects yet, so the properties
 * reported by get_object_vars() are written as a dict.
 *
 * @param  object $value
 * @return void
 */
protected function _writeObject($value)
{
    $properties = get_object_vars($value);
    $this->_writeArrayDict($properties);
}
|
|
|
|
/**
 * Write stop
 *
 * Appends the STOP opcode that terminates the pickle.
 *
 * @return void
 */
protected function _writeStop()
{
    $this->_pickle = $this->_pickle . self::OP_STOP;
}
|
|
|
|
/* serialize helper */
|
|
|
|
/**
 * Add a value to the memo and write the id
 *
 * The next free memo id is the current size of the memo; the value is
 * stored under it and a PUT for that id is written.
 *
 * @param  mixed $value
 * @return void
 */
protected function _momorize($value)
{
    $memoId = count($this->_memo);

    $this->_memo[$memoId] = $value;
    $this->_writePut($memoId);
}
|
|
|
|
/**
 * Search a value in the memo and return the id
 *
 * Uses a strict (type-sensitive) comparison.
 *
 * @param  mixed $value
 * @return int|false The id or false
 */
protected function _searchMomo($value)
{
    $memoId = array_search($value, $this->_memo, true);

    return $memoId;
}
|
|
|
|
/**
 * Is an array associative?
 *
 * An array counts as associative when at least one of its keys is not
 * in the range 0..count-1. The empty array is therefore not associative.
 *
 * The result is now a real boolean, as documented; it used to be the
 * array returned by array_diff_key(), which callers only tested for
 * truthiness.
 *
 * @param  array $value
 * @return boolean
 */
protected function _isArrayAssoc(array $value)
{
    // array_keys(array_keys($value)) is simply array(0, 1, ..., count - 1)
    $foreignKeys = array_diff_key($value, array_keys(array_keys($value)));

    return count($foreignKeys) > 0;
}
|
|
|
|
/**
 * Quote/Escape a string
 *
 * Escapes the bytes listed in self::$_quoteString plus the chosen
 * enclosure character. Double quotes are used as enclosure only when
 * the string contains both quote kinds and fewer single than double
 * quotes; otherwise single quotes are used.
 *
 * @param  string $str
 * @return string quoted string
 */
protected function _quoteString($str)
{
    $escapes = self::$_quoteString;

    $singles = substr_count($str, "'");
    $doubles = substr_count($str, '"');

    $useDoubleQuotes = ($singles > 0 && $doubles > 0 && $singles < $doubles);

    if ($useDoubleQuotes) {
        $enclosure    = '"';
        $escapes['"'] = '\\"';
    } else {
        $enclosure    = "'";
        $escapes["'"] = "\\'";
    }

    return $enclosure . strtr($str, $escapes) . $enclosure;
}
|
|
|
|
/* unserialize */
|
|
|
|
/**
 * Unserialize from Python Pickle format to PHP
 *
 * Opcodes are read and executed one at a time until STOP; the value
 * left on top of the stack is the result.
 *
 * @param  string $pickle
 * @param  array  $opts   Not used by this method
 * @return mixed
 * @throws Zend_Serializer_Exception on invalid Pickle string
 */
public function unserialize($pickle, array $opts = array())
{
    // set up the working state
    $this->_pos       = 0;
    $this->_pickle    = $pickle;
    $this->_pickleLen = strlen($this->_pickle);
    $this->_memo      = array();
    $this->_stack     = array();

    // run opcodes until STOP
    for ($op = $this->_read(1); $op !== self::OP_STOP; $op = $this->_read(1)) {
        $this->_load($op);
    }

    if (count($this->_stack) == 0) {
        throw new Zend_Serializer_Exception('No data found');
    }

    $result = array_pop($this->_stack);

    // drop the working state again
    $this->_pos       = 0;
    $this->_pickle    = '';
    $this->_pickleLen = 0;
    $this->_memo      = array();
    $this->_stack     = array();

    return $result;
}
|
|
|
|
/**
 * Load a pickle opcode
 *
 * Looks the opcode up in a table of handler method names and calls the
 * handler. Opcodes without a handler are rejected.
 *
 * @param  string $op
 * @return void
 * @throws Zend_Serializer_Exception on invalid opcode
 */
protected function _load($op)
{
    // Built on first use and then kept for the rest of the process.
    static $handlers = null;

    if ($handlers === null) {
        $handlers = array(
            self::OP_PUT             => '_loadPut',
            self::OP_BINPUT          => '_loadBinPut',
            self::OP_LONG_BINPUT     => '_loadLongBinPut',
            self::OP_GET             => '_loadGet',
            self::OP_BINGET          => '_loadBinGet',
            self::OP_LONG_BINGET     => '_loadLongBinGet',
            self::OP_NONE            => '_loadNone',
            self::OP_NEWTRUE         => '_loadNewTrue',
            self::OP_NEWFALSE        => '_loadNewFalse',
            self::OP_INT             => '_loadInt',
            self::OP_BININT          => '_loadBinInt',
            self::OP_BININT1         => '_loadBinInt1',
            self::OP_BININT2         => '_loadBinInt2',
            self::OP_LONG            => '_loadLong',
            self::OP_LONG1           => '_loadLong1',
            self::OP_LONG4           => '_loadLong4',
            self::OP_FLOAT           => '_loadFloat',
            self::OP_BINFLOAT        => '_loadBinFloat',
            self::OP_STRING          => '_loadString',
            self::OP_BINSTRING       => '_loadBinString',
            self::OP_SHORT_BINSTRING => '_loadShortBinString',
            self::OP_BINBYTES        => '_loadBinBytes',
            self::OP_SHORT_BINBYTES  => '_loadShortBinBytes',
            self::OP_UNICODE         => '_loadUnicode',
            self::OP_BINUNICODE      => '_loadBinUnicode',
            self::OP_MARK            => '_loadMark',
            self::OP_LIST            => '_loadList',
            self::OP_EMPTY_LIST      => '_loadEmptyList',
            self::OP_APPEND          => '_loadAppend',
            self::OP_APPENDS         => '_loadAppends',
            self::OP_DICT            => '_loadDict',
            self::OP_EMPTY_DICT      => '_loadEmptyDict',
            self::OP_SETITEM         => '_loadSetItem',
            self::OP_SETITEMS        => '_loadSetItems',
            self::OP_TUPLE           => '_loadTuple',
            self::OP_TUPLE1          => '_loadTuple1',
            self::OP_TUPLE2          => '_loadTuple2',
            self::OP_TUPLE3          => '_loadTuple3',
            self::OP_PROTO           => '_loadProto',
        );
    }

    if (!isset($handlers[$op])) {
        throw new Zend_Serializer_Exception('Invalid or unknown opcode "'.$op.'"');
    }

    $handler = $handlers[$op];
    $this->$handler();
}
|
|
|
|
/**
 * Load a PUT opcode
 *
 * Reads the decimal memo id from the current line and binds that memo
 * slot, by reference, to the value on top of the stack.
 *
 * The stack top is checked with array_key_exists(): isset() reported
 * "No stack exist" whenever the top value was null.
 *
 * @return void
 * @throws Zend_Serializer_Exception on missing stack
 */
protected function _loadPut()
{
    $id = (int)$this->_readline();

    $lastStack = count($this->_stack)-1;
    if (!array_key_exists($lastStack, $this->_stack)) {
        throw new Zend_Serializer_Exception('No stack exist');
    }
    $this->_memo[$id] = & $this->_stack[$lastStack];
}
|
|
|
|
/**
 * Load a binary PUT
 *
 * Reads a 1-byte memo id and binds that memo slot, by reference, to the
 * value on top of the stack.
 *
 * The stack top is checked with array_key_exists(): isset() reported
 * "No stack exist" whenever the top value was null.
 *
 * @return void
 * @throws Zend_Serializer_Exception on missing stack
 */
protected function _loadBinPut()
{
    $id = ord($this->_read(1));

    $lastStack = count($this->_stack)-1;
    if (!array_key_exists($lastStack, $this->_stack)) {
        throw new Zend_Serializer_Exception('No stack exist');
    }
    $this->_memo[$id] = & $this->_stack[$lastStack];
}
|
|
|
|
/**
 * Load a long binary PUT
 *
 * Reads a 4-byte little-endian memo id and binds that memo slot, by
 * reference, to the value on top of the stack.
 *
 * The stack top is checked with array_key_exists(): isset() reported
 * "No stack exist" whenever the top value was null.
 *
 * @return void
 * @throws Zend_Serializer_Exception on missing stack
 */
protected function _loadLongBinPut()
{
    $bin = $this->_read(4);
    if (self::$_isLittleEndian === false) {
        // unpack('l') uses machine byte order; the pickle is little-endian
        $bin = strrev($bin);
    }
    list(, $id) = unpack('l', $bin);

    $lastStack = count($this->_stack)-1;
    if (!array_key_exists($lastStack, $this->_stack)) {
        throw new Zend_Serializer_Exception('No stack exist');
    }
    $this->_memo[$id] = & $this->_stack[$lastStack];
}
|
|
|
|
/**
 * Load a GET operation
 *
 * Reads the decimal memo id from the current line and pushes a
 * reference to that memo entry on the stack.
 *
 * @return void
 * @throws Zend_Serializer_Exception on missing GET identifier
 */
protected function _loadGet()
{
    $memoId = (int) $this->_readline();

    if (array_key_exists($memoId, $this->_memo)) {
        $this->_stack[] = & $this->_memo[$memoId];
        return;
    }

    throw new Zend_Serializer_Exception('Get id "' . $memoId . '" not found in momo');
}
|
|
|
|
/**
 * Load a binary GET operation
 *
 * Reads a 1-byte memo id and pushes a reference to that memo entry on
 * the stack.
 *
 * @return void
 * @throws Zend_Serializer_Exception on missing GET identifier
 */
protected function _loadBinGet()
{
    $memoId = ord($this->_read(1));

    if (array_key_exists($memoId, $this->_memo)) {
        $this->_stack[] = & $this->_memo[$memoId];
        return;
    }

    throw new Zend_Serializer_Exception('Get id "' . $memoId . '" not found in momo');
}
|
|
|
|
/**
 * Load a long binary GET operation
 *
 * Reads a 4-byte little-endian memo id and pushes a reference to that
 * memo entry on the stack.
 *
 * @return void
 * @throws Zend_Serializer_Exception on missing GET identifier
 */
protected function _loadLongBinGet()
{
    $packedId = $this->_read(4);
    if (self::$_isLittleEndian === false) {
        $packedId = strrev($packedId);
    }
    list(, $memoId) = unpack('l', $packedId);

    if (array_key_exists($memoId, $this->_memo)) {
        $this->_stack[] = & $this->_memo[$memoId];
        return;
    }

    throw new Zend_Serializer_Exception('Get id "' . $memoId . '" not found in momo');
}
|
|
|
|
/**
 * Load a NONE operator
 *
 * Pushes null on the stack.
 *
 * @return void
 */
protected function _loadNone()
{
    array_push($this->_stack, null);
}
|
|
|
|
/**
 * Load a boolean TRUE operator
 *
 * Pushes true on the stack.
 *
 * @return void
 */
protected function _loadNewTrue()
{
    array_push($this->_stack, true);
}
|
|
|
|
/**
 * Load a boolean FALSE operator
 *
 * Pushes false on the stack.
 *
 * @return void
 */
protected function _loadNewFalse()
{
    array_push($this->_stack, false);
}
|
|
|
|
/**
 * Load an integer operator
 *
 * The arguments "01" and "00" are the text encoding of true and false;
 * any other argument is cast to an integer.
 *
 * @return void
 */
protected function _loadInt()
{
    $argument = $this->_readline();

    if ('01' === $argument) {
        $decoded = true;
    } elseif ('00' === $argument) {
        $decoded = false;
    } else {
        $decoded = (int) $argument;
    }

    $this->_stack[] = $decoded;
}
|
|
|
|
/**
 * Load a binary integer operator
 *
 * Reads a 4-byte little-endian signed integer and pushes it.
 *
 * @return void
 */
protected function _loadBinInt()
{
    $packed = $this->_read(4);
    if (self::$_isLittleEndian === false) {
        $packed = strrev($packed);
    }

    $unpacked = unpack('l', $packed);
    $this->_stack[] = $unpacked[1];
}
|
|
|
|
/**
 * Load a 1-byte unsigned integer (BININT1)
 *
 * Reads one byte and pushes its ordinal value.
 *
 * @return void
 */
protected function _loadBinInt1()
{
    $byte = $this->_read(1);
    $this->_stack[] = ord($byte);
}
|
|
|
|
/**
 * Load a 2-byte unsigned integer (BININT2)
 *
 * Reads two bytes and decodes them as a little-endian unsigned short.
 *
 * @return void
 */
protected function _loadBinInt2()
{
    $unpacked = unpack('v', $this->_read(2));
    $this->_stack[] = $unpacked[1];
}
|
|
|
|
/**
 * Load a long integer given as decimal text (LONG)
 *
 * Trailing "L" characters are stripped from the line. The digits are
 * pushed unchanged as a string; an empty argument is pushed as integer 0.
 *
 * @return void
 */
protected function _loadLong()
{
    $digits = rtrim($this->_readline(), 'L');

    $this->_stack[] = ($digits === '') ? 0 : $digits;
}
|
|
|
|
/**
 * Load a long integer with a 1-byte length prefix (LONG1)
 *
 * Reads the byte count, then that many bytes, and pushes the value
 * decoded by _decodeBinLong().
 *
 * @return void
 */
protected function _loadLong1()
{
    $byteCount = ord($this->_read(1));
    $payload   = $this->_read($byteCount);

    array_push($this->_stack, $this->_decodeBinLong($payload));
}
|
|
|
|
/**
 * Load a long integer with a 4-byte length prefix (LONG4)
 *
 * Reads a 4-byte little-endian signed byte count, then that many bytes,
 * and pushes the value decoded by _decodeBinLong().
 *
 * Fixes the big-endian path, which called strrev($$nBin) (a variable
 * variable named after the binary data) instead of strrev($nBin), and
 * rejects negative byte counts.
 *
 * @return void
 * @throws Zend_Serializer_Exception on a negative byte count
 */
protected function _loadLong4()
{
    $nBin = $this->_read(4);
    if (self::$_isLittleEndian === false) {
        // unpack('l') uses machine byte order; the pickle is little-endian
        $nBin = strrev($nBin);
    }
    list(, $n) = unpack('l', $nBin);

    if ($n < 0) {
        throw new Zend_Serializer_Exception('LONG4 pickle has negative byte count');
    }

    $data = $this->_read($n);

    $this->_stack[] = $this->_decodeBinLong($data);
}
|
|
|
|
/**
 * Load a float value
 *
 * Casts the text argument on the current line to float and pushes it.
 *
 * @return void
 */
protected function _loadFloat()
{
    $argument = $this->_readline();
    $this->_stack[] = (float) $argument;
}
|
|
|
|
/**
 * Load a binary float value
 *
 * Reads 8 bytes, reverses them on little-endian machines (the pickle
 * stores the float big-endian) and decodes them with unpack('d').
 *
 * @return void
 */
protected function _loadBinFloat()
{
    $packed = $this->_read(8);
    if (self::$_isLittleEndian === true) {
        $packed = strrev($packed);
    }

    $unpacked = unpack('d', $packed);
    $this->_stack[] = $unpacked[1];
}
|
|
|
|
/**
 * Load a string
 *
 * Reads the quoted argument on the current line and pushes the unquoted
 * string.
 *
 * @return void
 */
protected function _loadString()
{
    $quoted = (string) $this->_readline();
    $this->_stack[] = $this->_unquoteString($quoted);
}
|
|
|
|
/**
 * Load a binary string
 *
 * Reads a 4-byte little-endian length, then that many bytes, and pushes
 * them as a string.
 *
 * @return void
 */
protected function _loadBinString()
{
    $packedLength = $this->_read(4);
    if (!self::$_isLittleEndian) {
        $packedLength = strrev($packedLength);
    }

    $unpacked = unpack('l', $packedLength);
    $length   = $unpacked[1];

    $this->_stack[] = (string) $this->_read($length);
}
|
|
|
|
/**
 * Load a short binary string
 *
 * Reads a 1-byte length, then that many bytes, and pushes them as a
 * string.
 *
 * @return void
 */
protected function _loadShortBinString()
{
    $length  = ord($this->_read(1));
    $payload = $this->_read($length);

    $this->_stack[] = (string) $payload;
}
|
|
|
|
/**
 * Load arbitrary binary bytes (BINBYTES)
 *
 * Reads a 4-byte little-endian signed length, then that many bytes, and
 * pushes them.
 *
 * Fixes the big-endian path, which called strrev($$nBin) (a variable
 * variable named after the binary data) instead of strrev($nBin), and
 * rejects negative lengths.
 *
 * @return void
 * @throws Zend_Serializer_Exception on a negative length
 */
protected function _loadBinBytes()
{
    // read byte length
    $nBin = $this->_read(4);
    if (self::$_isLittleEndian === false) {
        // unpack('l') uses machine byte order; the pickle is little-endian
        $nBin = strrev($nBin);
    }
    list(, $n) = unpack('l', $nBin);

    if ($n < 0) {
        throw new Zend_Serializer_Exception('BINBYTES pickle has negative byte count');
    }

    $this->_stack[] = $this->_read($n);
}
|
|
|
|
/**
 * Load a short run of binary bytes (SHORT_BINBYTES)
 *
 * Reads a 1-byte length, then that many bytes, and pushes them.
 *
 * @return void
 */
protected function _loadShortBinBytes()
{
    $length  = ord($this->_read(1));
    $payload = $this->_read($length);

    array_push($this->_stack, $payload);
}
|
|
|
|
/**
 * Load a unicode string
 *
 * Reads the raw-unicode-escaped argument on the current line and
 * replaces every \uXXXX and \UXXXXXXXX escape with the UTF-8 encoding
 * of that code point.
 *
 * The pattern is matched byte-wise (no "u" modifier). With "u",
 * preg_replace_callback() returns null for a subject that is not valid
 * UTF-8, so a line holding raw Latin-1 bytes was pushed as null.
 * Both escape forms are handled in a single pass through a branch-reset
 * group, so the hex digits are always capture group 1.
 *
 * NOTE(review): bytes >= 0x80 that are not part of an escape are passed
 * through unchanged; confirm whether callers expect them converted from
 * Latin-1 to UTF-8.
 *
 * @return void
 * @throws Zend_Serializer_Exception on an unsupported code point
 */
protected function _loadUnicode()
{
    $data    = $this->_readline();
    $pattern = '/\\\\(?|u([a-fA-F0-9]{4})|U([a-fA-F0-9]{8}))/'; // \uXXXX or \UXXXXXXXX
    $data    = preg_replace_callback($pattern, array($this, '_convertMatchingUnicodeSequence2Utf8'), $data);

    $this->_stack[] = $data;
}
|
|
|
|
/**
 * Convert a unicode sequence to UTF-8
 *
 * Callback for preg_replace_callback(): the first capture group holds
 * the hexadecimal code point.
 *
 * @param  array $match
 * @return string
 */
protected function _convertMatchingUnicodeSequence2Utf8(array $match)
{
    $hexCodePoint = $match[1];

    return $this->_hex2Utf8($hexCodePoint);
}
|
|
|
|
/**
 * Convert a hex string to a UTF-8 string
 *
 * Encodes the code point given in hexadecimal as 1 to 4 UTF-8 bytes.
 *
 * @param  string $hex Hexadecimal code point
 * @return string
 * @throws Zend_Serializer_Exception for code points of 0x110000 and above
 */
protected function _hex2Utf8($hex)
{
    $codePoint = hexdec($hex);

    if ($codePoint < 0x80) {
        // 1 byte
        return chr($codePoint);
    }

    if ($codePoint < 0x800) {
        // 2 bytes
        return chr(0xC0 | ($codePoint >> 6))
             . chr(0x80 | ($codePoint & 0x3F));
    }

    if ($codePoint < 0x10000) {
        // 3 bytes
        return chr(0xE0 | ($codePoint >> 12))
             . chr(0x80 | (($codePoint >> 6) & 0x3F))
             . chr(0x80 | ($codePoint & 0x3F));
    }

    if ($codePoint < 0x110000) {
        // 4 bytes
        return chr(0xF0 | ($codePoint >> 18))
             . chr(0x80 | (($codePoint >> 12) & 0x3F))
             . chr(0x80 | (($codePoint >> 6) & 0x3F))
             . chr(0x80 | ($codePoint & 0x3F));
    }

    throw new Zend_Serializer_Exception('Unsupported unicode character found "' . dechex($codePoint) . '"');
}
|
|
|
|
/**
 * Load binary unicode sequence
 *
 * Reads a 4-byte little-endian length, then that many bytes, and pushes
 * them unchanged.
 *
 * @return void
 */
protected function _loadBinUnicode()
{
    // read byte length
    $packedLength = $this->_read(4);
    if (self::$_isLittleEndian === false) {
        $packedLength = strrev($packedLength);
    }

    $unpacked = unpack('l', $packedLength);
    $payload  = $this->_read($unpacked[1]);

    $this->_stack[] = $payload;
}
|
|
|
|
/**
 * Load a marker sequence
 *
 * Pushes the marker sentinel object on the stack.
 *
 * @return void
 */
protected function _loadMark()
{
    array_push($this->_stack, $this->_marker);
}
|
|
|
|
/**
 * Load an array (list)
 *
 * Replaces the topmost marker and everything above it with one list
 * holding the items that were above the marker, in stack order.
 *
 * Two fixes. The items above the marker used to be discarded, so a LIST
 * preceded by items came out empty. And the items were removed with
 * unset(), which does not lower PHP's next append key: later pushes
 * landed beyond count() - 1 and broke every count()-based stack access.
 * Items are now removed with array_pop(), which keeps keys contiguous.
 *
 * @return void
 * @throws Zend_Serializer_Exception if the stack holds no marker
 */
protected function _loadList()
{
    $k = $this->_lastMarker();
    if ($k < 0) {
        throw new Zend_Serializer_Exception('No marker found on stack');
    }

    // pop everything above the marker (this yields the items reversed)
    $items = array();
    while (count($this->_stack) > $k + 1) {
        $items[] = array_pop($this->_stack);
    }

    // the marker slot becomes the list
    $this->_stack[$k] = array_reverse($items);
}
|
|
|
|
/**
 * Load an append (to list) sequence
 *
 * Pops the top value and appends it to the list that is then on top of
 * the stack.
 *
 * @return void
 */
protected function _loadAppend()
{
    $item = array_pop($this->_stack);

    $topIndex = count($this->_stack) - 1;
    $target   =& $this->_stack[$topIndex];
    $target[] = $item;
}
|
|
|
|
/**
 * Load an empty list sequence
 *
 * Pushes an empty array on the stack.
 *
 * @return void
 */
protected function _loadEmptyList()
{
    array_push($this->_stack, array());
}
|
|
|
|
/**
 * Load multiple append (to list) sequences at once
 *
 * Appends every item above the topmost marker to the list directly
 * below the marker, then removes the items and the marker.
 *
 * Items and marker are removed with array_pop() instead of unset().
 * unset() does not lower PHP's next append key, so later pushes landed
 * beyond count() - 1 and nested structures were decoded wrongly.
 *
 * @return void
 * @throws Zend_Serializer_Exception if there is no marker with a value below it
 */
protected function _loadAppends()
{
    $k = $this->_lastMarker();
    if ($k < 1) {
        throw new Zend_Serializer_Exception('No list found below a marker on stack');
    }

    // pop everything above the marker (this yields the items reversed)
    $items = array();
    while (count($this->_stack) > $k + 1) {
        $items[] = array_pop($this->_stack);
    }
    array_pop($this->_stack); // the marker itself

    $list =& $this->_stack[$k - 1];
    foreach (array_reverse($items) as $item) {
        $list[] = $item;
    }
}
|
|
|
|
/**
 * Load an associative array (Python dictionary)
 *
 * Replaces the topmost marker and everything above it with one array
 * built from the key/value pairs that were above the marker.
 *
 * Two fixes. The pairs above the marker used to be discarded. And they
 * were removed with unset(), which does not lower PHP's next append
 * key, so later pushes landed beyond count() - 1. Items are now removed
 * with array_pop(), which keeps keys contiguous.
 *
 * @return void
 * @throws Zend_Serializer_Exception if the stack holds no marker or an
 *                                   odd number of items follows it
 */
protected function _loadDict()
{
    $k = $this->_lastMarker();
    if ($k < 0) {
        throw new Zend_Serializer_Exception('No marker found on stack');
    }

    // pop everything above the marker (this yields the items reversed)
    $items = array();
    while (count($this->_stack) > $k + 1) {
        $items[] = array_pop($this->_stack);
    }
    $items = array_reverse($items);

    $count = count($items);
    if ($count % 2 != 0) {
        throw new Zend_Serializer_Exception('Odd number of items for DICT');
    }

    $dict = array();
    for ($i = 0; $i < $count; $i += 2) {
        $dict[$items[$i]] = $items[$i + 1];
    }

    // the marker slot becomes the dictionary
    $this->_stack[$k] = $dict;
}
|
|
|
|
/**
 * Load a key/value pair into a dictionary (SETITEM)
 *
 * Pops the value, then the key, and stores the pair in the array that
 * is then on top of the stack.
 *
 * @return void
 */
protected function _loadSetItem()
{
    $itemValue = array_pop($this->_stack);
    $itemKey   = array_pop($this->_stack);

    $topIndex = count($this->_stack) - 1;
    $target   =& $this->_stack[$topIndex];
    $target[$itemKey] = $itemValue;
}
|
|
|
|
/**
 * Load an empty dictionary
 *
 * Pushes an empty array on the stack.
 *
 * @return void
 */
protected function _loadEmptyDict()
{
    array_push($this->_stack, array());
}
|
|
|
|
/**
 * Load several key/value pairs into a dictionary at once (SETITEMS)
 *
 * Stores every key/value pair above the topmost marker in the array
 * directly below the marker, then removes the pairs and the marker.
 *
 * Pairs and marker are removed with array_pop() instead of unset().
 * unset() does not lower PHP's next append key, so later pushes landed
 * beyond count() - 1 and nested structures were decoded wrongly. An odd
 * number of items, which used to read an undefined offset, is rejected.
 *
 * @return void
 * @throws Zend_Serializer_Exception if there is no marker with a value
 *                                   below it, or the item count is odd
 */
protected function _loadSetItems()
{
    $k = $this->_lastMarker();
    if ($k < 1) {
        throw new Zend_Serializer_Exception('No dictionary found below a marker on stack');
    }

    // pop everything above the marker (this yields the items reversed)
    $items = array();
    while (count($this->_stack) > $k + 1) {
        $items[] = array_pop($this->_stack);
    }
    array_pop($this->_stack); // the marker itself
    $items = array_reverse($items);

    $count = count($items);
    if ($count % 2 != 0) {
        throw new Zend_Serializer_Exception('Odd number of items for SETITEMS');
    }

    $dict =& $this->_stack[$k - 1];
    for ($i = 0; $i < $count; $i += 2) {
        $dict[$items[$i]] = $items[$i + 1];
    }
}
|
|
|
|
/**
 * Load a tuple
 *
 * Replaces the topmost marker and everything above it with one array
 * holding the items that were above the marker, in stack order.
 *
 * Items are removed with array_pop() instead of unset(). unset() does
 * not lower PHP's next append key, so later pushes landed beyond
 * count() - 1 and broke every count()-based stack access.
 *
 * @return void
 * @throws Zend_Serializer_Exception if the stack holds no marker
 */
protected function _loadTuple()
{
    $k = $this->_lastMarker();
    if ($k < 0) {
        throw new Zend_Serializer_Exception('No marker found on stack');
    }

    // pop everything above the marker (this yields the items reversed)
    $items = array();
    while (count($this->_stack) > $k + 1) {
        $items[] = array_pop($this->_stack);
    }

    // the marker slot becomes the tuple
    $this->_stack[$k] = array_reverse($items);
}
|
|
|
|
/**
 * Load single item tuple
 *
 * Pops one value and pushes it back wrapped in a 1-element array.
 *
 * @return void
 */
protected function _loadTuple1()
{
    $only = array_pop($this->_stack);

    array_push($this->_stack, array($only));
}
|
|
|
|
/**
 * Load two item tuple
 *
 * Pops two values and pushes them back as a 2-element array that keeps
 * their original stack order.
 *
 * @return void
 */
protected function _loadTuple2()
{
    $second = array_pop($this->_stack);
    $first  = array_pop($this->_stack);

    array_push($this->_stack, array($first, $second));
}
|
|
|
|
/**
 * Load three item tuple
 *
 * Pops three values and pushes them back as a 3-element array that
 * keeps their original stack order.
 *
 * @return void
 */
protected function _loadTuple3()
{
    $third  = array_pop($this->_stack);
    $second = array_pop($this->_stack);
    $first  = array_pop($this->_stack);

    array_push($this->_stack, array($first, $second, $third));
}
|
|
|
|
/**
 * Load a proto value
 *
 * Reads the 1-byte protocol version and stores it. Only versions 2 and
 * 3 are accepted.
 *
 * @return void
 * @throws Zend_Serializer_Exception if the version is not 2 or 3
 */
protected function _loadProto()
{
    $version = ord($this->_read(1));

    if ($version >= 2 && $version <= 3) {
        $this->_protocol = $version;
        return;
    }

    throw new Zend_Serializer_Exception('Invalid protocol version detected');
}
|
|
|
|
/* unserialize helper */
|
|
|
|
/**
 * Read a segment of the pickle
 *
 * Returns the next $len bytes and advances the read position.
 *
 * Negative lengths are rejected. They can come from a signed 4-byte
 * length field in a corrupt pickle and used to pass the bounds check,
 * moving the read position backwards. The result is always a string
 * (older PHP versions return false from substr() for an empty slice at
 * the end of the data).
 *
 * @param  int $len Number of bytes to read
 * @return string
 * @throws Zend_Serializer_Exception if the length is negative or
 *                                   reaches past the end of the data
 */
protected function _read($len)
{
    if ($len < 0) {
        throw new Zend_Serializer_Exception('Invalid negative read length');
    }

    if (($this->_pos + $len) > $this->_pickleLen) {
        throw new Zend_Serializer_Exception('End of data');
    }

    $chunk = (string) substr($this->_pickle, $this->_pos, $len);
    $this->_pos += $len;

    return $chunk;
}
|
|
|
|
/**
 * Read a line of the pickle at once
 *
 * Returns the bytes from the read position up to the next line break,
 * without the break, and moves the read position past it. Both "\n"
 * and "\r\n" are accepted as line breaks.
 *
 * The line ends at the first "\n"; a "\r" directly before it belongs to
 * the break. The old code searched the whole remaining pickle for
 * "\r\n" first, so a "\n"-terminated line followed anywhere later by a
 * "\r\n" (for example inside binary data) was read far too long.
 *
 * @return string
 * @throws Zend_Serializer_Exception if no EOL character found
 */
protected function _readline()
{
    $eolPos = strpos($this->_pickle, "\n", $this->_pos);
    if ($eolPos === false) {
        throw new Zend_Serializer_Exception('No new line found');
    }

    // drop a carriage return that is part of a "\r\n" line break
    $lineEnd = $eolPos;
    if ($lineEnd > $this->_pos && $this->_pickle[$lineEnd - 1] === "\r") {
        $lineEnd--;
    }

    $ret = (string) substr($this->_pickle, $this->_pos, $lineEnd - $this->_pos);
    $this->_pos = $eolPos + 1;

    return $ret;
}
|
|
|
|
/**
 * Unquote/Unescape a quoted string
 *
 * Strips the enclosing quote characters from the trimmed input and
 * reverses the escapes of self::$_quoteString plus the escape of the
 * enclosure character (taken from the first character of the input).
 *
 * @param  string $str quoted string
 * @return string unquoted string
 */
protected function _unquoteString($str)
{
    $unescapes = array_flip(self::$_quoteString);

    // only the enclosing quote kind appears escaped inside the string
    $enclosure = ($str[0] == '"') ? '"' : "'";
    $unescapes['\\' . $enclosure] = $enclosure;

    $inner = substr(trim($str), 1, -1);

    return strtr($inner, $unescapes);
}
|
|
|
|
/**
 * Return last marker position in stack
 *
 * Scans the stack from the top down for the marker sentinel.
 *
 * Throws when the stack holds no marker. It used to return -1, which
 * callers then used as a stack index. Slots missing from the stack are
 * skipped instead of read.
 *
 * @return int Index of the topmost marker
 * @throws Zend_Serializer_Exception if the stack holds no marker
 */
protected function _lastMarker()
{
    for ($k = count($this->_stack)-1; $k >= 0; $k -= 1) {
        // isset() also skips null entries, which can never be the marker
        if (isset($this->_stack[$k]) && $this->_stack[$k] === $this->_marker) {
            return $k;
        }
    }

    throw new Zend_Serializer_Exception('No marker found on stack');
}
|
|
|
|
/**
 * Decode a binary long sequence
 *
 * Interprets the bytes as a little-endian two's-complement integer.
 * Up to 7 bytes are decoded with native arithmetic. Longer values are
 * decoded with bcmath and returned as a decimal string, or as INF when
 * bcmath is not loaded. An empty sequence decodes to 0.
 *
 * @param  string $data
 * @return int|float|string
 */
protected function _decodeBinLong($data)
{
    $nbytes = strlen($data);
    if ($nbytes == 0) {
        return 0;
    }

    // a set top bit in the last (most significant) byte means negative
    $isNegative = (ord($data[$nbytes - 1]) >= 0x80);

    if ($nbytes <= 7) {
        $native = 0;
        foreach (str_split($data) as $index => $byte) {
            $native += ord($byte) * pow(256, $index);
        }
        if ($isNegative) {
            $native -= pow(2, $nbytes * 8);
        }

        return $native;
    }

    if (!extension_loaded('bcmath')) {
        return INF;
    }

    $big = 0;
    foreach (str_split($data) as $index => $byte) {
        $big = bcadd($big, bcmul(ord($byte), bcpow(256, $index, 0)));
    }
    if ($isNegative) {
        $big = bcsub($big, bcpow(2, $nbytes * 8));
    }

    return $big;
}
|
|
}
|