ucftools/matlab/+msgpack/parsemsgpack.m

195 lines
6.5 KiB
Matlab

%PARSEMSGPACK parses a msgpack byte buffer into Matlab data structures
% PARSEMSGPACK(BYTES)
% reads BYTES as msgpack data, and creates Matlab data structures
% from it. The number of bytes consumed by the parsemsgpack call
% is returned in the variable IDX.
% - strings are converted to strings
% - numbers are converted to appropriate numeric values
% - true, false are converted to logical 1, 0
% - nil is converted to []
% - arrays are converted to cell arrays
% - maps are converted to containers.Map
% (c) 2016 Bastian Bechtold
% This code is licensed under the BSD 3-clause license
function [obj, idx] = parsemsgpack(bytes)
[obj, idx] = parse(uint8(bytes(:)), 1);
end
function [obj, idx] = parse(bytes, idx)
% masks:
b10000000 = 128;
b01111111 = 127;
b11000000 = 192;
b00111111 = 63;
b11100000 = 224;
b00011111 = 31;
b11110000 = 240;
b00001111 = 15;
% values:
b00000000 = 0;
b10010000 = 144;
b10100000 = 160;
currentbyte = bytes(idx);
if bitand(b10000000, currentbyte) == b00000000
% decode positive fixint
obj = int8(currentbyte);
idx = idx + 1;
return
elseif bitand(b11100000, currentbyte) == b11100000
% decode negative fixint
obj = typecast(currentbyte, 'int8');
idx = idx + 1;
return
elseif bitand(b11110000, currentbyte) == b10000000
% decode fixmap
len = double(bitand(b00001111, currentbyte));
[obj, idx] = parsemap(len, bytes, idx+1);
return
elseif bitand(b11110000, currentbyte) == b10010000
% decode fixarray
len = double(bitand(b00001111, currentbyte));
[obj, idx] = parsearray(len, bytes, idx+1);
return
elseif bitand(b11100000, currentbyte) == b10100000
% decode fixstr
len = double(bitand(b00011111, currentbyte));
[obj, idx] = parsestring(len, bytes, idx + 1);
return
end
switch currentbyte
case 192 % nil
obj = [];
idx = idx+1;
% case 193 % unused
case 194 % false
obj = false;
idx = idx+1;
case 195 % true
obj = true;
idx = idx+1;
case 196 % bin8
len = double(bytes(idx+1));
[obj, idx] = parsebytes(len, bytes, idx+2);
case 197 % bin16
len = double(bytes2scalar(bytes(idx+1:idx+2), 'uint16'));
[obj, idx] = parsebytes(len, bytes, idx+3);
case 198 % bin32
len = double(bytes2scalar(bytes(idx+1:idx+4), 'uint32'));
[obj, idx] = parsebytes(len, bytes, idx+5);
case 199 % ext8
len = double(bytes(idx+1));
[obj, idx] = parseext(len, bytes, idx+2);
case 200 % ext16
len = double(bytes2scalar(bytes(idx+1:idx+2), 'uint16'));
[obj, idx] = parseext(len, bytes, idx+3);
case 201 % ext32
len = double(bytes2scalar(bytes(idx+1:idx+4), 'uint32'));
[obj, idx] = parseext(len, bytes, idx+5);
case 202 % float32
obj = bytes2scalar(bytes(idx+1:idx+4), 'single');
idx = idx+5;
case 203 % float64
obj = bytes2scalar(bytes(idx+1:idx+8), 'double');
idx = idx+9;
case 204 % uint8
obj = bytes(idx+1);
idx = idx+2;
case 205 % uint16
obj = bytes2scalar(bytes(idx+1:idx+2), 'uint16');
idx = idx+3;
case 206 % uint32
obj = bytes2scalar(bytes(idx+1:idx+4), 'uint32');
idx = idx+5;
case 207 % uint64
obj = bytes2scalar(bytes(idx+1:idx+8), 'uint64');
idx = idx+9;
case 208 % int8
obj = bytes2scalar(bytes(idx+1), 'int8');
idx = idx+2;
case 209 % int16
obj = bytes2scalar(bytes(idx+1:idx+2), 'int16');
idx = idx+3;
case 210 % int32
obj = bytes2scalar(bytes(idx+1:idx+4), 'int32');
idx = idx+5;
case 211 % int64
obj = bytes2scalar(bytes(idx+1:idx+8), 'int64');
idx = idx+9;
case 212 % fixext1
[obj, idx] = parseext(1, bytes, idx+1);
case 213 % fixext2
[obj, idx] = parseext(2, bytes, idx+1);
case 214 % fixext4
[obj, idx] = parseext(4, bytes, idx+1);
case 215 % fixext8
[obj, idx] = parseext(8, bytes, idx+1);
case 216 % fixext16
[obj, idx] = parseext(16, bytes, idx+1);
case 217 % str8
len = double(bytes(idx+1));
[obj, idx] = parsestring(len, bytes, idx+2);
case 218 % str16
len = double(bytes2scalar(bytes(idx+1:idx+2), 'uint16'));
[obj, idx] = parsestring(len, bytes, idx+3);
case 219 % str32
len = double(bytes2scalar(bytes(idx+1:idx+4), 'uint32'));
[obj, idx] = parsestring(len, bytes, idx+5);
case 220 % array16
len = double(bytes2scalar(bytes(idx+1:idx+2), 'uint16'));
[obj, idx] = parsearray(len, bytes, idx+3);
case 221 % array32
len = double(bytes2scalar(bytes(idx+1:idx+4), 'uint32'));
[obj, idx] = parsearray(len, bytes, idx+5);
case 222 % map16
len = double(bytes2scalar(bytes(idx+1:idx+2), 'uint16'));
[obj, idx] = parsemap(len, bytes, idx+3);
case 223 % map32
len = double(bytes2scalar(bytes(idx+1:idx+4), 'uint32'));
[obj, idx] = parsemap(len, bytes, idx+5);
otherwise
error('transplant:parsemsgpack:unknowntype', ...
['Unknown type "' dec2bin(currentbyte) '"']);
end
end
function value = bytes2scalar(bytes, type)
% reverse byte order to convert from little-endian to big-endian
value = typecast(bytes(end:-1:1), type);
end
function [str, idx] = parsestring(len, bytes, idx)
str = native2unicode(bytes(idx:idx+len-1)', 'utf-8');
idx = idx + len;
end
function [out, idx] = parsebytes(len, bytes, idx)
out = bytes(idx:idx+len-1);
idx = idx + len;
end
function [out, idx] = parseext(len, bytes, idx)
out.type = bytes(idx);
out.data = bytes(idx+1:idx+len);
idx = idx + len + 1;
end
function [out, idx] = parsearray(len, bytes, idx)
out = cell(1, len);
for n=1:len
[out{n}, idx] = parse(bytes, idx);
end
end
function [out, idx] = parsemap(len, bytes, idx)
out = containers.Map();
for n=1:len
[key, idx] = parse(bytes, idx);
[out(key), idx] = parse(bytes, idx);
end
end