-
Notifications
You must be signed in to change notification settings - Fork 38
/
Copy pathSerialize.pm
437 lines (371 loc) · 12.8 KB
/
Serialize.pm
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
# Movable Type (r) Open Source (C) 2001-2010 Six Apart, Ltd.
# This program is distributed under the terms of the
# GNU General Public License, version 2.
#
# $Id$
package MT::Serialize;
use strict;
our $VERSION = 5;
{

    # Dispatch table: serializer name => [ freeze routine, thaw routine ].
    # Every native "MT*" flavour shares _thaw_mt, which inspects the header
    # of the stream to decide how to decode it.
    my %Types = (
        Storable => [ \&_freeze_storable,    \&_thaw_storable ],
        JSON     => [ \&_freeze_json,        \&_thaw_json ],
        MT       => [ \&_freeze_mt_5,        \&_thaw_mt ],
        MT2      => [ \&_freeze_mt_2,        \&_thaw_mt ],
        MTS      => [ \&_freeze_mt_storable, \&_thaw_mt ],
        MTJ      => [ \&_freeze_mt_json,     \&_thaw_mt ],
    );

    # new( $type )
    #
    # Class-method constructor.  $type must be one of the keys of %Types
    # (the lookup is case-sensitive).  Returns an object whose 'freeze' and
    # 'thaw' slots hold the code references for that serializer.
    #
    # Croaks when $type is undefined or unknown.  Without this check the
    # object would be built with undef slots and only fail later, inside
    # serialize/unserialize, with an unhelpful "undefined value as a
    # subroutine reference" error.
    sub new {
        my ( $class, $name ) = @_;
        my $pair = defined $name ? $Types{$name} : undef;
        if ( !$pair ) {
            require Carp;
            Carp::croak( "Unknown serializer type '"
                    . ( defined $name ? $name : '' )
                    . "'; expected one of: "
                    . join( ', ', sort keys %Types ) );
        }
        return bless { freeze => $pair->[0], thaw => $pair->[1] }, $class;
    }
}
# Serializer used when serialize/unserialize are invoked without an object;
# built on first use and then reused.
my $default_serializer;

# _default_serializer()
#
# Returns the cached default serializer, creating it on the first call from
# the value of MT's 'Serializer' configuration setting.
sub _default_serializer {

    # Direct method call instead of the indirect-object form
    # "new MT::Serialize(...)", whose parse depends on what is in scope.
    return $default_serializer
        ||= MT::Serialize->new( MT->config->Serializer );
}
# serialize( @args )
#
# Runs the 'freeze' routine of the invocant on the remaining arguments and
# returns its result.  When the invocant is not a reference (for example
# when called as a class method) the shared default serializer is used.
sub serialize {
    my $self = shift;
    if ( !ref $self ) {
        $self = _default_serializer();
    }
    my $freezer = $self->{freeze};
    return $freezer->(@_);
}
# unserialize( @args )
#
# Runs the 'thaw' routine of the invocant on the remaining arguments and
# returns its result.  When the invocant is not a reference (for example
# when called as a class method) the shared default serializer is used.
sub unserialize {
    my $self = shift;
    if ( !ref $self ) {
        $self = _default_serializer();
    }
    my $thawer = $self->{thaw};
    return $thawer->(@_);
}
# _freeze_storable( @args )
#
# Loads Storable on demand and hands the arguments straight to
# Storable::freeze, returning the frozen image.
sub _freeze_storable {
    require Storable;
    return Storable::freeze(@_);
}
# _thaw_storable( @args )
#
# Loads Storable on demand and hands the arguments straight to
# Storable::thaw, returning whatever it reconstructs.
# NOTE(review): Storable's documentation warns against thawing data from
# untrusted sources -- confirm callers only pass trusted input.
sub _thaw_storable {
    require Storable;
    return Storable::thaw(@_);
}
# _freeze_json( \$data )
#
# Loads JSON on demand, dereferences the first argument once and returns
# the result of JSON::encode_json on that value.
sub _freeze_json {
    require JSON;
    return JSON::encode_json( ${ $_[0] } );
}
# _thaw_json( $text )
#
# Loads JSON on demand, decodes the first argument with JSON::decode_json
# and returns a reference to the decoded value.
sub _thaw_json {
    require JSON;
    my $text = shift;
    return \JSON::decode_json($text);
}
# _freeze_mt( \$data )
#
# Kept only for backward compatibility, in case plugins reference this
# routine directly: forwards its arguments to _freeze_mt_1 and returns
# that routine's result.
sub _freeze_mt {
    return _freeze_mt_1(@_);
}
# _freeze_mt_1( \$hashref )
#
# Version 1 encoder for a flat hash.  The output is the signature 'SERG'
# followed, for every key, by: packed 'N' key length, key, packed 'N' value
# length, value.  Undefined values are written as empty strings and every
# value is passed through no_utf8() before it is measured.
sub _freeze_mt_1 {
    my ($ref) = @_;
    my @pieces = ('SERG');
    foreach my $name ( keys %{$$ref} ) {
        my $data = ${$ref}->{$name};
        $data = '' if !defined $data;
        no_utf8($data);
        push @pieces,
            pack( 'N', length($name) ), $name,
            pack( 'N', length($data) ), $data;
    }
    return join '', @pieces;
}
# _macrofreeze( $value )
#
# Encodes $value into the tagged stream used by the native MT format and
# returns that string.  The traversal is iterative: an explicit @stack of
# pending containers replaces recursion.  Every item is written as a
# one-character tag followed by its payload; counts and lengths are packed
# with 'N':
#   'H' + key count      hash; each entry is key length, key, encoded value
#   'A' + element count  array; followed by each encoded element
#   'S' + length + data  reference to a plain scalar
#   'R'                  reference to a reference; followed by its target
#   '-' + length + data  plain (non-reference) scalar
#   'U'                  undef
#   'P' + index          pointer to a reference that was already written
# A reference of any other type (CODE, blessed object, ...) is replaced by a
# reference to undef, so it is written as 'R' followed by 'U'.
# Scalar payloads are passed through no_utf8() before being measured.
sub _macrofreeze {
use bytes;
my $value = shift;
my $ref_cnt = 1; # for compatibility with the existing algorithm
# Maps each reference seen so far to the index used by 'P' pointers.
my %refs;
my $frozen = '';
# Each stack entry is [ TYPE, remaining items... ]; items are consumed from
# the front until only the TYPE marker is left.
my @stack;
while (1) {
if (@stack) {
# Take the next pending item from the innermost open container.
my $top = $stack[-1];
if ( $top->[0] eq 'ARRAY' || $top->[0] eq 'REF' ) {
$value = splice @$top, 1, 1;
}
elsif ( $top->[0] eq 'HASH' ) {
# Hash entries are stored flattened as key, value pairs; the key is
# written here and the value is encoded below like any other item.
( my ($key), $value ) = splice @$top, 1, 2;
$frozen .= pack( 'N', length($key) ) . $key;
}
else {
die "Unexpected type '@{[$top->[0]]}' in _macrofreeze\n";
}
# Only the TYPE marker is left: this container is exhausted.
pop @stack if @$top <= 1;
}
my $ref = ref $value;
if ($ref) {
if ( exists $refs{$value} ) {
# Already written: emit a pointer instead of encoding it again.
$frozen .= 'P' . pack( 'N', $refs{$value} );
}
else {
$refs{$value} = $ref_cnt++;
if ( $ref !~ /^(HASH|ARRAY|SCALAR|REF)$/ ) {
# unknown reference type-- CODE or foreign package?
$value = \undef;
$ref = 'REF';
}
if ( $ref eq 'SCALAR' ) {
no_utf8($$value);
$frozen .= 'S' . pack( 'N', length($$value) ) . $$value;
}
elsif ( $ref eq 'REF' ) {
$frozen .= 'R';
push( @stack, [ 'REF' => $$value ] );
}
elsif ( $ref eq 'ARRAY' ) {
# Empty containers write only their header and are never pushed.
$frozen .= 'A' . pack( 'N', scalar(@$value) );
push( @stack, [ 'ARRAY' => @$value ] ) if scalar @$value;
}
elsif ( $ref eq 'HASH' ) {
$frozen .= 'H' . pack( 'N', scalar( keys %$value ) );
push( @stack, [ 'HASH' => %$value ] ) if keys %$value;
}
else {
die "Unexpected type '$ref' in _macrofreeze\n";
}
} ## end else [ if ( exists $refs{$value...})]
} ## end if ($ref)
else {
if ( defined $value ) {
no_utf8($value);
$frozen .= '-' . pack( 'N', length($value) ) . $value;
}
else {
$frozen .= 'U';
}
}
# Nothing left to visit once every open container has been drained.
last if !@stack;
} ## end while (1)
return $frozen;
} ## end sub _macrofreeze
# _freeze_mt_2( \$data )
#
# Version 2 encoder.  The stream starts with a 12-byte header -- 'SERG',
# a packed long 0 and the packed protocol number 2 -- followed by the
# _macrofreeze encoding of the referenced data.
sub _freeze_mt_2 {
    my ($ref) = @_;
    my $header = pack( 'a4 N N', 'SERG', 0, 2 );
    return $header . _macrofreeze($$ref);
}
# _freeze_mt_storable( \$data )
#
# Version 3 encoder.  The stream starts with a 12-byte header -- 'SERG',
# a packed long 0 and the packed protocol number 3 -- followed by the
# Storable::nfreeze image of the referenced data.
sub _freeze_mt_storable {
    my ($ref) = @_;
    require Storable;
    my $header = pack( 'a4 N N', 'SERG', 0, 3 );
    return $header . Storable::nfreeze($$ref);
}
# _freeze_mt_json( \$data )
#
# Version 4 encoder.  The stream starts with a 12-byte header -- 'SERG',
# a packed long 0 and the packed protocol number 4 -- followed by the
# JSON::encode_json text of the referenced data.
sub _freeze_mt_json {
    my ($ref) = @_;
    require JSON;
    my $header = pack( 'a4 N N', 'SERG', 0, 4 );
    return $header . JSON::encode_json($$ref);
}
# no_utf8( @scalars )
#
# Rewrites each argument in place (arguments are aliased, so the caller's
# variables change) with the result of pack 'C0A*' on its current value.
# Arguments that are references are skipped.
sub no_utf8 {
    foreach my $item (@_) {
        $item = pack( 'C0A*', $item ) unless ref $item;
    }
}
# _freeze_mt_5( \$data )
#
# Encoder behind the 'MT' serializer.  It produces a version 2 stream via
# _freeze_mt_2, but for the duration of that call no_utf8() is replaced by
# a routine that encodes UTF-8-flagged scalars into the configured
# 'PublishCharset' (default 'UTF-8') instead of applying pack 'C0A*'.
sub _freeze_mt_5 {

    # Encode is used below but was never loaded by this module; load it on
    # demand the same way the Storable/JSON helpers load their backends.
    require Encode;
    my $enc = MT->config('PublishCharset') || 'UTF-8';
    no warnings 'redefine';

    # local() restores the original no_utf8 when this sub returns, so the
    # override is only visible to the _freeze_mt_2 call below.
    local *no_utf8 = sub {
        for (@_) {
            next if ref;
            $_ = Encode::encode( $enc, $_ ) if Encode::is_utf8($_);
        }
    };
    _freeze_mt_2(@_);
}
# _thaw_mt( $frozen )
#
# Entry point for decoding any native MT stream.  Returns a reference to
# the thawed data, or a reference to an empty hash reference when the input
# is empty, lacks the 'SERG' signature, or names a protocol version that
# cannot be handled.
#
# Layout: 'SERG' followed by a packed long.  A non-zero long means a
# version 1 stream (handled by _thaw_mt_1).  Zero means a versioned stream
# whose next packed long is the protocol number N, decoded by _thaw_mt_N.
sub _thaw_mt {
    my ($frozen) = @_;
    return \{} unless $frozen && substr( $frozen, 0, 4 ) eq 'SERG';

    my $marker = unpack 'N', substr( $frozen, 4, 4 );
    return _thaw_mt_1($frozen) if $marker;

    # Header too short to carry a version number: treat it as version 0,
    # which is rejected below, without reading outside the string.
    my $version
        = length($frozen) >= 12
        ? unpack( 'N', substr( $frozen, 8, 4 ) )
        : 0;

    if ( $version > 0 && $version <= $VERSION ) {

        # Not every number up to $VERSION has a decoder, so resolve the
        # handler first; a symbolic call to a missing sub would die.
        my $handler = __PACKAGE__->can( '_thaw_mt_' . $version );
        return $handler->($frozen) if $handler;
    }
    return \{};
}
# _thaw_mt_1( $frozen )
#
# Version 1 decoder.  After the 'SERG' signature the stream is a sequence
# of records: packed 'N' key length, key, packed 'N' value length, value.
# Returns a reference to a hash reference holding the decoded pairs, or
# nothing when the signature is missing.
sub _thaw_mt_1 {
    my ($frozen) = @_;
    return if substr( $frozen, 0, 4 ) ne 'SERG';

    my $body   = substr( $frozen, 4 );    # everything after the signature
    my $total  = length $body;
    my $offset = 0;
    my %columns;
    while ( $offset < $total ) {
        my $name_len = unpack 'N', substr( $body, $offset, 4 );
        my $name
            = $name_len ? substr( $body, $offset + 4, $name_len ) : '';
        $offset += 4 + $name_len;

        my $data_len = unpack 'N', substr( $body, $offset, 4 );
        my $data = substr( $body, $offset + 4, $data_len );
        $offset += 4 + $data_len;

        $columns{$name} = $data;
    }
    my $thawed = \%columns;
    return \$thawed;
}
# _macrowave( $frozen, $pos )
#
# Decodes one value from the tagged stream in $frozen, starting at byte
# offset $pos, and returns it.  Dies unless exactly two arguments are given
# or if the container stack ends up holding an unexpected reference type.
#
# Tags understood (counts, lengths and indexes are packed 'N'):
#   'H' + key count      hash; each entry is key length, key, encoded value
#   'A' + element count  array; followed by each encoded element
#   'S' + length + data  reference to a scalar
#   'R'                  reference whose target is the next encoded value
#   '-' + length + data  plain scalar
#   'U'                  undef
#   'P' + index          pointer to a reference decoded earlier
# Any other tag yields undef.  Scalar payloads that are not UTF-8 flagged
# are decoded from the configured 'PublishCharset' (default 'UTF-8').
#
# The decoder is iterative: @stack holds the containers still waiting for
# children, each as [ container, children still missing, pending hash key ].
sub _macrowave {
    use bytes;
    @_ == 2 or die "_macrowave expects: \$frozen, \$pos\n";
    my ( $frozen, $pos ) = @_;

    # Encode is used below but is not loaded anywhere else in this module.
    require Encode;

    # Index 0 is a dummy so that pointer indexes start at 1.
    my $refs = [undef];
    my $len  = length $frozen;
    my ( @stack, $value );
    my $enc = MT->app->config('PublishCharset') || 'UTF-8';
    while ( $pos < $len ) {
        my $type = substr( $frozen, $pos, 1 );
        $pos++;
        my $newref;
        $value = $type eq 'H'
            ? do {    # hashref
            my $keys = unpack 'N', substr( $frozen, $pos, 4 );
            $pos += 4;
            my $values = {};
            push @$refs, $values;
            $newref = [ $values, $keys ];
            $values;
            }
            : $type eq 'A' ? do {    # arrayref
            my $array_count = unpack 'N', substr( $frozen, $pos, 4 );
            $pos += 4;
            my $values = [];
            push @$refs, $values;
            $newref = [ $values, $array_count ];
            $values;
            }
            : $type eq 'S' ? do {    # scalarref
            my $slen = unpack 'N', substr( $frozen, $pos, 4 );
            my $col_val = substr( $frozen, $pos + 4, $slen );
            $col_val = Encode::decode( $enc, $col_val )
                if !( Encode::is_utf8($col_val) );
            $pos += 4 + $slen;
            push @$refs, \$col_val;
            \$col_val;
            }
            : $type eq 'R' ? do {    # refref
                # The target is filled in when the next value is decoded,
                # so the placeholder must be a fresh, writable scalar.
                # \(undef) would reference a read-only value.
            my $slot;
            my $holder = \$slot;
            push @$refs, $holder;
            $newref = [ $holder, 1 ];
            $holder;
            }
            : $type eq '-' ? do {    # scalar value
            my $slen = unpack 'N', substr( $frozen, $pos, 4 );
            my $col_val = substr( $frozen, $pos + 4, $slen );
            $col_val = Encode::decode( $enc, $col_val )
                if !( Encode::is_utf8($col_val) );
            $pos += 4 + $slen;
            $col_val;
            }
            : $type eq 'U' ? do {    # undef
            undef;
            }
            : $type eq 'P' ? do {    # pointer to known ref
            my $ptr = unpack 'N', substr( $frozen, $pos, 4 );
            $pos += 4;
            $refs->[$ptr];
            }
            : undef;

        # if there is something on the stack, it has to be a complex ref
        # (ARRAY, HASH, REF); the value just decoded is its next child
        if (@stack) {
            my $top = $stack[-1];
            --$top->[1];
            my $kind = ref $top->[0];
            if ( $kind eq 'HASH' ) {
                $top->[0]->{ $top->[2] } = $value;
            }
            elsif ( $kind eq 'ARRAY' ) {
                push( @{ $top->[0] }, $value );
            }
            elsif ( $kind eq 'REF' || $kind eq 'SCALAR' ) {

                # An 'R' placeholder reports SCALAR until its target has
                # been stored, so both spellings must be accepted here.
                ${ $top->[0] } = $value;
            }
            else {
                die
                    "Unexpected reference type in _macrowave @$top; expected HASH, ARRAY, or REF\n";
            }
        }
        push( @stack, $newref ) if $newref;

        # pop all completed elements
        while ( @stack && $stack[-1]->[1] == 0 ) {
            $value = $stack[-1]->[0];
            pop(@stack);
        }

        # if the top one is hash, process next key
        if ( @stack && $stack[-1]->[1] > 0 && ref $stack[-1]->[0] eq 'HASH' )
        {
            my $key_name_len = unpack 'N', substr( $frozen, $pos, 4 );
            $stack[-1]->[2] = substr( $frozen, $pos + 4, $key_name_len );
            $pos += 4 + $key_name_len;
        }
        last if !@stack;    # if nothing on the stack, we're done here
    } ## end while ( $pos < $len )
    return $value;
} ## end sub _macrowave
# _thaw_mt_2( $frozen )
#
# Decoder for protocol version 2 (native MT encoding).  Skips the 12-byte
# signature/version header and lets _macrowave rebuild the value.  Returns
# a reference to the result (an empty hash reference if nothing was
# decoded), or nothing when the 'SERG' signature is missing.
sub _thaw_mt_2 {
    my ($frozen) = @_;
    return if substr( $frozen, 0, 4 ) ne 'SERG';

    # 12 = length of signature plus version block
    my $thawed = _macrowave( $frozen, 12 );
    $thawed = {} if !defined $thawed;
    return \$thawed;
}
# _thaw_mt_3( $frozen )
#
# Decoder for protocol version 3 (Storable payload).  Skips the 12-byte
# signature/version header and passes the remainder to Storable::thaw.
# Returns a reference to the result (an empty hash reference if thaw gave
# undef), or nothing when the 'SERG' signature is missing.
# NOTE(review): Storable's documentation warns against thawing data from
# untrusted sources -- confirm callers only pass trusted input.
sub _thaw_mt_3 {
    my ($frozen) = @_;
    return if substr( $frozen, 0, 4 ) ne 'SERG';
    require Storable;

    # 12 = length of signature plus version block
    my $thawed = Storable::thaw( substr( $frozen, 12 ) );
    $thawed = {} if !defined $thawed;
    return \$thawed;
}
# _thaw_mt_4( $frozen )
#
# Decoder for protocol version 4 (JSON payload).  Skips the 12-byte
# signature/version header and passes the remainder to JSON::decode_json.
# Returns a reference to the result (an empty hash reference if the decoded
# value is undef), or nothing when the 'SERG' signature is missing.
sub _thaw_mt_4 {
    my ($frozen) = @_;
    return if substr( $frozen, 0, 4 ) ne 'SERG';
    require JSON;

    # 12 = length of signature plus version block
    my $thawed = JSON::decode_json( substr( $frozen, 12 ) );
    $thawed = {} if !defined $thawed;
    return \$thawed;
}
1;
__END__
=head1 NAME
MT::Serialize - Data serialization library
=head1 SYNOPSIS
my $serializer = MT::Serialize->new(MT->config->Serializer);
my $data = { 'this' => 'is', 'my' => 'data' };
my $frozen = $serializer->serialize( \$data );
my $thawed = $serializer->unserialize( $frozen );
=head1 DESCRIPTION
This package provides an abstraction layer to the serialization methods that
are available to Movable Type. The user can select the type of serialization
they want to use by specifying it in the mt.cfg file with the 'Serializer'
configuration key. 'MT', 'MT2', 'MTS', 'MTJ', 'Storable' and 'JSON' are the
currently available serialization methods.
=head1 USAGE
=head2 MT::Serialize->new( $type )
Constructor that returns an object with methods that are appropriate for
the I<$type> of serialization requested.
=head2 MT::Serialize->serialize( $data )
Converts the data given into a bytestream, suitable for storage in a
BerkeleyDB table, a BLOB field in a database or a flat file.
Note that the $data parameter must be a reference to whatever data you
want to serialize. For instance, if you are serializing a hashref, you
should pass through a reference to the hashref.
=head2 MT::Serialize->unserialize( $data )
Converts a serialized bytestream given back into the original Perl data
structure. It returns a reference to whatever data structure was
reconstructed.
=head2 no_utf8
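This function rewrites each of its scalar arguments in place, replacing it
with the result of C<pack 'C0A*'> on its value, so that it can be stored as
a string without UTF-8 semantics. Arguments that are references are left
untouched.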
=head1 COMPATIBILITY NOTES
Version 2 of the native MT serializer changes the structure of the
stream quite a bit, but remains backward compatible. If version 1
frozen data is fed into the MT thaw method, it will handle it using
the legacy code. Then upon reserializing the data, it will be
upgraded to the new format. The new encoding includes a version
number which should allow us more flexibility in upgrading the
encoding format in the future, without worrying about breaking or
upgrading existing serialized data.
The updated protocol allows you to store most any Perl data structure,
although it does not currently support references to objects, code
references or globs.
=cut