refactor python reader to take a get_bytes function; add reader tests [#38]

This commit is contained in:
Brandon Liu
2022-04-26 16:15:03 +08:00
parent adb6f896a3
commit 3944d27833
4 changed files with 79 additions and 39 deletions

View File

@@ -3,20 +3,26 @@ import mmap
from contextlib import contextmanager
@contextmanager
def read(fname):
r = Reader(fname)
try:
yield r
finally:
r.close()
def MmapSource(f):
mapping = mmap.mmap(f.fileno(), 0)
def get_bytes(offset, length):
return mapping[offset : offset + length]
return get_bytes
def MemorySource(buf):
def get_bytes(offset, length):
return buf[offset : offset + length]
return get_bytes
class Reader:
def __init__(self, fname):
self.f = open(fname, "r+b")
self.mmap = mmap.mmap(self.f.fileno(), 0)
assert int.from_bytes(self.mmap[0:2], byteorder="little") == 0x4D50
def __init__(self, get_bytes):
self.get_bytes = get_bytes
assert int.from_bytes(self.get_bytes(0, 2), byteorder="little") == 0x4D50
first_entry_idx = 10 + self.metadata_len
self.root_dir, self.leaves = self.load_directory(
first_entry_idx, self.root_entries
@@ -26,11 +32,11 @@ class Reader:
directory = {}
leaves = {}
for i in range(offset, offset + num_entries * 17, 17):
z = int.from_bytes(self.mmap[i : i + 1], byteorder="little")
x = int.from_bytes(self.mmap[i + 1 : i + 4], byteorder="little")
y = int.from_bytes(self.mmap[i + 4 : i + 7], byteorder="little")
tile_off = int.from_bytes(self.mmap[i + 7 : i + 13], byteorder="little")
tile_len = int.from_bytes(self.mmap[i + 13 : i + 17], byteorder="little")
z = int.from_bytes(self.get_bytes(i, 1), byteorder="little")
x = int.from_bytes(self.get_bytes(i + 1, 3), byteorder="little")
y = int.from_bytes(self.get_bytes(i + 4, 3), byteorder="little")
tile_off = int.from_bytes(self.get_bytes(i + 7, 6), byteorder="little")
tile_len = int.from_bytes(self.get_bytes(i + 13, 4), byteorder="little")
if z & 0b10000000:
leaves[(z & 0b01111111, x, y)] = (tile_off, tile_len)
else:
@@ -42,20 +48,20 @@ class Reader:
@property
def metadata_len(self):
return int.from_bytes(self.mmap[4:8], byteorder="little")
return int.from_bytes(self.get_bytes(4, 4), byteorder="little")
@property
def metadata(self):
s = self.mmap[10 : 10 + self.metadata_len]
s = self.get_bytes(10, self.metadata_len)
return json.loads(s)
@property
def version(self):
return int.from_bytes(self.mmap[2:4], byteorder="little")
return int.from_bytes(self.get_bytes(2, 2), byteorder="little")
@property
def root_entries(self):
return int.from_bytes(self.mmap[8:10], byteorder="little")
return int.from_bytes(self.get_bytes(8, 2), byteorder="little")
@property
def leaf_level(self):
@@ -64,7 +70,7 @@ class Reader:
def get(self, z, x, y):
val = self.root_dir.get((z, x, y))
if val:
return self.mmap[val[0] : val[0] + val[1]]
return self.get_bytes(val[0], val[1])
else:
if len(self.leaves) > 0:
level_diff = z - self.leaf_level
@@ -74,12 +80,12 @@ class Reader:
directory, _ = self.load_directory(val[0], val[1] // 17)
val = directory.get((z, x, y))
if val:
return self.mmap[val[0] : val[0] + val[1]]
return self.get_bytes(val[0], val[1])
def tiles(self):
for k, v in self.root_dir.items():
yield (k, self.mmap[v[0] : v[0] + v[1]])
yield (k, self.get_bytes(v[0], v[1]))
for val in self.leaves.values():
leaf_dir, _ = self.load_directory(val[0], val[1] // 17)
for k, v in leaf_dir.items():
yield (k, self.mmap[v[0] : v[0] + v[1]])
yield (k, self.get_bytes(v[0], v[1]))