232 lines
7.0 KiB
Python
232 lines
7.0 KiB
Python
|
"""sstruct.py -- SuperStruct
|
||
|
|
||
|
Higher level layer on top of the struct module, enabling to
|
||
|
bind names to struct elements. The interface is similar to
|
||
|
struct, except the objects passed and returned are not tuples
|
||
|
(or argument lists), but dictionaries or instances.
|
||
|
|
||
|
Just like struct, we use fmt strings to describe a data
|
||
|
structure, except we use one line per element. Lines are
|
||
|
separated by newlines or semi-colons. Each line contains
|
||
|
either one of the special struct characters ('@', '=', '<',
|
||
|
'>' or '!') or a 'name:formatchar' combo (eg. 'myFloat:f').
|
||
|
Repetitions, like the struct module offers them are not useful
|
||
|
in this context, except for fixed length strings (eg. 'myInt:5h'
|
||
|
is not allowed but 'myString:5s' is). The 'x' fmt character
|
||
|
(pad byte) is treated as 'special', since it is by definition
|
||
|
anonymous. Extra whitespace is allowed everywhere.
|
||
|
|
||
|
The sstruct module offers one feature that the "normal" struct
|
||
|
module doesn't: support for fixed point numbers. These are spelled
|
||
|
as "n.mF", where n is the number of bits before the point, and m
|
||
|
the number of bits after the point. Fixed point numbers get
|
||
|
converted to floats.
|
||
|
|
||
|
pack(fmt, object):
|
||
|
'object' is either a dictionary or an instance (or actually
|
||
|
anything that has a __dict__ attribute). If it is a dictionary,
|
||
|
its keys are used for names. If it is an instance, it's
|
||
|
attributes are used to grab struct elements from. Returns
|
||
|
a string containing the data.
|
||
|
|
||
|
unpack(fmt, data, object=None)
|
||
|
If 'object' is omitted (or None), a new dictionary will be
|
||
|
returned. If 'object' is a dictionary, it will be used to add
|
||
|
struct elements to. If it is an instance (or in fact anything
|
||
|
that has a __dict__ attribute), an attribute will be added for
|
||
|
each struct element. In the latter two cases, 'object' itself
|
||
|
is returned.
|
||
|
|
||
|
unpack2(fmt, data, object=None)
|
||
|
Convenience function. Same as unpack, except data may be longer
|
||
|
than needed. The returned value is a tuple: (object, leftoverdata).
|
||
|
|
||
|
calcsize(fmt)
|
||
|
like struct.calcsize(), but uses our own fmt strings:
|
||
|
it returns the size of the data in bytes.
|
||
|
"""
|
||
|
|
||
|
from fontTools.misc.fixedTools import fixedToFloat as fi2fl, floatToFixed as fl2fi
|
||
|
from fontTools.misc.textTools import tobytes, tostr
|
||
|
import struct
|
||
|
import re
|
||
|
|
||
|
__version__ = "1.2"
|
||
|
__copyright__ = "Copyright 1998, Just van Rossum <just@letterror.com>"
|
||
|
|
||
|
|
||
|
class Error(Exception):
|
||
|
pass
|
||
|
|
||
|
|
||
|
def pack(fmt, obj):
|
||
|
formatstring, names, fixes = getformat(fmt, keep_pad_byte=True)
|
||
|
elements = []
|
||
|
if not isinstance(obj, dict):
|
||
|
obj = obj.__dict__
|
||
|
string_index = formatstring
|
||
|
if formatstring.startswith(">"):
|
||
|
string_index = formatstring[1:]
|
||
|
for ix, name in enumerate(names.keys()):
|
||
|
value = obj[name]
|
||
|
if name in fixes:
|
||
|
# fixed point conversion
|
||
|
value = fl2fi(value, fixes[name])
|
||
|
elif isinstance(value, str):
|
||
|
value = tobytes(value)
|
||
|
elements.append(value)
|
||
|
# Check it fits
|
||
|
try:
|
||
|
struct.pack(names[name], value)
|
||
|
except Exception as e:
|
||
|
raise ValueError(
|
||
|
"Value %s does not fit in format %s for %s" % (value, names[name], name)
|
||
|
) from e
|
||
|
data = struct.pack(*(formatstring,) + tuple(elements))
|
||
|
return data
|
||
|
|
||
|
|
||
|
def unpack(fmt, data, obj=None):
|
||
|
if obj is None:
|
||
|
obj = {}
|
||
|
data = tobytes(data)
|
||
|
formatstring, names, fixes = getformat(fmt)
|
||
|
if isinstance(obj, dict):
|
||
|
d = obj
|
||
|
else:
|
||
|
d = obj.__dict__
|
||
|
elements = struct.unpack(formatstring, data)
|
||
|
for i in range(len(names)):
|
||
|
name = list(names.keys())[i]
|
||
|
value = elements[i]
|
||
|
if name in fixes:
|
||
|
# fixed point conversion
|
||
|
value = fi2fl(value, fixes[name])
|
||
|
elif isinstance(value, bytes):
|
||
|
try:
|
||
|
value = tostr(value)
|
||
|
except UnicodeDecodeError:
|
||
|
pass
|
||
|
d[name] = value
|
||
|
return obj
|
||
|
|
||
|
|
||
|
def unpack2(fmt, data, obj=None):
|
||
|
length = calcsize(fmt)
|
||
|
return unpack(fmt, data[:length], obj), data[length:]
|
||
|
|
||
|
|
||
|
def calcsize(fmt):
|
||
|
formatstring, names, fixes = getformat(fmt)
|
||
|
return struct.calcsize(formatstring)
|
||
|
|
||
|
|
||
|
# matches "name:formatchar" (whitespace is allowed)
|
||
|
_elementRE = re.compile(
|
||
|
r"\s*" # whitespace
|
||
|
r"([A-Za-z_][A-Za-z_0-9]*)" # name (python identifier)
|
||
|
r"\s*:\s*" # whitespace : whitespace
|
||
|
r"([xcbB?hHiIlLqQfd]|" # formatchar...
|
||
|
r"[0-9]+[ps]|" # ...formatchar...
|
||
|
r"([0-9]+)\.([0-9]+)(F))" # ...formatchar
|
||
|
r"\s*" # whitespace
|
||
|
r"(#.*)?$" # [comment] + end of string
|
||
|
)
|
||
|
|
||
|
# matches the special struct fmt chars and 'x' (pad byte)
|
||
|
_extraRE = re.compile(r"\s*([x@=<>!])\s*(#.*)?$")
|
||
|
|
||
|
# matches an "empty" string, possibly containing whitespace and/or a comment
|
||
|
_emptyRE = re.compile(r"\s*(#.*)?$")
|
||
|
|
||
|
_fixedpointmappings = {8: "b", 16: "h", 32: "l"}
|
||
|
|
||
|
_formatcache = {}
|
||
|
|
||
|
|
||
|
def getformat(fmt, keep_pad_byte=False):
|
||
|
fmt = tostr(fmt, encoding="ascii")
|
||
|
try:
|
||
|
formatstring, names, fixes = _formatcache[fmt]
|
||
|
except KeyError:
|
||
|
lines = re.split("[\n;]", fmt)
|
||
|
formatstring = ""
|
||
|
names = {}
|
||
|
fixes = {}
|
||
|
for line in lines:
|
||
|
if _emptyRE.match(line):
|
||
|
continue
|
||
|
m = _extraRE.match(line)
|
||
|
if m:
|
||
|
formatchar = m.group(1)
|
||
|
if formatchar != "x" and formatstring:
|
||
|
raise Error("a special fmt char must be first")
|
||
|
else:
|
||
|
m = _elementRE.match(line)
|
||
|
if not m:
|
||
|
raise Error("syntax error in fmt: '%s'" % line)
|
||
|
name = m.group(1)
|
||
|
formatchar = m.group(2)
|
||
|
if keep_pad_byte or formatchar != "x":
|
||
|
names[name] = formatchar
|
||
|
if m.group(3):
|
||
|
# fixed point
|
||
|
before = int(m.group(3))
|
||
|
after = int(m.group(4))
|
||
|
bits = before + after
|
||
|
if bits not in [8, 16, 32]:
|
||
|
raise Error("fixed point must be 8, 16 or 32 bits long")
|
||
|
formatchar = _fixedpointmappings[bits]
|
||
|
names[name] = formatchar
|
||
|
assert m.group(5) == "F"
|
||
|
fixes[name] = after
|
||
|
formatstring += formatchar
|
||
|
_formatcache[fmt] = formatstring, names, fixes
|
||
|
return formatstring, names, fixes
|
||
|
|
||
|
|
||
|
def _test():
|
||
|
fmt = """
|
||
|
# comments are allowed
|
||
|
> # big endian (see documentation for struct)
|
||
|
# empty lines are allowed:
|
||
|
|
||
|
ashort: h
|
||
|
along: l
|
||
|
abyte: b # a byte
|
||
|
achar: c
|
||
|
astr: 5s
|
||
|
afloat: f; adouble: d # multiple "statements" are allowed
|
||
|
afixed: 16.16F
|
||
|
abool: ?
|
||
|
apad: x
|
||
|
"""
|
||
|
|
||
|
print("size:", calcsize(fmt))
|
||
|
|
||
|
class foo(object):
|
||
|
pass
|
||
|
|
||
|
i = foo()
|
||
|
|
||
|
i.ashort = 0x7FFF
|
||
|
i.along = 0x7FFFFFFF
|
||
|
i.abyte = 0x7F
|
||
|
i.achar = "a"
|
||
|
i.astr = "12345"
|
||
|
i.afloat = 0.5
|
||
|
i.adouble = 0.5
|
||
|
i.afixed = 1.5
|
||
|
i.abool = True
|
||
|
|
||
|
data = pack(fmt, i)
|
||
|
print("data:", repr(data))
|
||
|
print(unpack(fmt, data))
|
||
|
i2 = foo()
|
||
|
unpack(fmt, data, i2)
|
||
|
print(vars(i2))
|
||
|
|
||
|
|
||
|
if __name__ == "__main__":
|
||
|
_test()
|