littlefs/scripts/dbglfs.py

#!/usr/bin/env python3

import bisect
import collections as co
import functools as ft
import itertools as it
import math as m
import os
import struct


TAG_NULL            = 0x0000
TAG_CONFIG          = 0x0000
TAG_MAGIC           = 0x0003
TAG_VERSION         = 0x0004
TAG_RCOMPAT         = 0x0005
TAG_WCOMPAT         = 0x0006
TAG_OCOMPAT         = 0x0007
TAG_GEOMETRY        = 0x0009
TAG_NAMELIMIT       = 0x000c
TAG_SIZELIMIT       = 0x000d
TAG_GDELTA          = 0x0100
TAG_GRMDELTA        = 0x0100
TAG_NAME            = 0x0200
TAG_REG             = 0x0201
TAG_DIR             = 0x0202
TAG_ORPHAN          = 0x0203
TAG_BOOKMARK        = 0x0204
TAG_STRUCT          = 0x0300
TAG_DATA            = 0x0300
TAG_BLOCK           = 0x0304
TAG_BSHRUB          = 0x0308
TAG_BTREE           = 0x030c
TAG_DID             = 0x0310
TAG_BECKSUM         = 0x0314
TAG_BRANCH          = 0x031c
TAG_MROOT           = 0x0321
TAG_MDIR            = 0x0325
TAG_MTREE           = 0x032c
TAG_UATTR           = 0x0400
TAG_SATTR           = 0x0600
TAG_SHRUB           = 0x1000
TAG_CKSUM           = 0x3000
TAG_ECKSUM          = 0x3100
TAG_ALT             = 0x4000
TAG_GT              = 0x2000
TAG_R               = 0x1000


# some ways of block geometry representations
# 512      -> 512
# 512x16   -> (512, 16)
# 0x200x10 -> (512, 16)
def bdgeom(s):
    s = s.strip()
    b = 10
    if s.startswith('0x') or s.startswith('0X'):
        s = s[2:]
        b = 16
    elif s.startswith('0o') or s.startswith('0O'):
        s = s[2:]
        b = 8
    elif s.startswith('0b') or s.startswith('0B'):
        s = s[2:]
        b = 2

    if 'x' in s:
        s, s_ = s.split('x', 1)
        return (int(s, b), int(s_, b))
    else:
        return int(s, b)

# parse some rbyd addr encodings
# 0xa       -> [0xa]
# 0xa.c     -> [(0xa, 0xc)]
# 0x{a,b}   -> [0xa, 0xb]
# 0x{a,b}.c -> [(0xa, 0xc), (0xb, 0xc)]
def rbydaddr(s):
    s = s.strip()
    b = 10
    if s.startswith('0x') or s.startswith('0X'):
        s = s[2:]
        b = 16
    elif s.startswith('0o') or s.startswith('0O'):
        s = s[2:]
        b = 8
    elif s.startswith('0b') or s.startswith('0B'):
        s = s[2:]
        b = 2

    trunk = None
    if '.' in s:
        s, s_ = s.split('.', 1)
        trunk = int(s_, b)

    if s.startswith('{') and '}' in s:
        ss = s[1:s.find('}')].split(',')
    else:
        ss = [s]

    addr = []
    for s in ss:
        if trunk is not None:
            addr.append((int(s, b), trunk))
        else:
            addr.append(int(s, b))

    return addr

def crc32c(data, crc=0):
    crc ^= 0xffffffff
    for b in data:
        crc ^= b
        for j in range(8):
            crc = (crc >> 1) ^ ((crc & 1) * 0x82f63b78)
    return 0xffffffff ^ crc

def popc(x):
    return bin(x).count('1')

def fromle32(data):
    return struct.unpack('<I', data[0:4].ljust(4, b'\0'))[0]

def fromleb128(data):
    word = 0
    for i, b in enumerate(data):
        word |= ((b & 0x7f) << 7*i)
        word &= 0xffffffff
        if not b & 0x80:
            return word, i+1
    return word, len(data)

def fromtag(data):
    data = data.ljust(4, b'\0')
    tag = (data[0] << 8) | data[1]
    weight, d = fromleb128(data[2:])
    size, d_ = fromleb128(data[2+d:])
    return tag>>15, tag&0x7fff, weight, size, 2+d+d_

def frommdir(data):
    blocks = []
    d = 0
    while d < len(data):
        block, d_ = fromleb128(data[d:])
        blocks.append(block)
        d += d_
    return blocks

def fromshrub(data):
    d = 0
    weight, d_ = fromleb128(data[d:]); d += d_
    trunk, d_ = fromleb128(data[d:]); d += d_
    return weight, trunk

def frombranch(data):
    d = 0
    block, d_ = fromleb128(data[d:]); d += d_
    trunk, d_ = fromleb128(data[d:]); d += d_
    cksum = fromle32(data[d:]); d += 4
    return block, trunk, cksum

def frombtree(data):
    d = 0
    w, d_ = fromleb128(data[d:]); d += d_
    block, trunk, cksum = frombranch(data[d:])
    return w, block, trunk, cksum

def frombptr(data):
    d = 0
    size, d_ = fromleb128(data[d:]); d += d_
    block, d_ = fromleb128(data[d:]); d += d_
    off, d_ = fromleb128(data[d:]); d += d_
    cksize, d_ = fromleb128(data[d:]); d += d_
    cksum = fromle32(data[d:]); d += 4
    return size, block, off, cksize, cksum

def xxd(data, width=16):
    for i in range(0, len(data), width):
        yield '%-*s %-*s' % (
            3*width,
            ' '.join('%02x' % b for b in data[i:i+width]),
            width,
            ''.join(
                b if b >= ' ' and b <= '~' else '.'
                for b in map(chr, data[i:i+width])))

def tagrepr(tag, w, size, off=None):
    if (tag & 0xefff) == TAG_NULL:
        return '%snull%s%s' % (
            'shrub' if tag & TAG_SHRUB else '',
            ' w%d' % w if w else '',
            ' %d' % size if size else '')
    elif (tag & 0xef00) == TAG_CONFIG:
        return '%s%s%s %d' % (
            'shrub' if tag & TAG_SHRUB else '',
            'magic' if (tag & 0xfff) == TAG_MAGIC
                else 'version' if (tag & 0xfff) == TAG_VERSION
                else 'rcompat' if (tag & 0xfff) == TAG_RCOMPAT
                else 'wcompat' if (tag & 0xfff) == TAG_WCOMPAT
                else 'ocompat' if (tag & 0xfff) == TAG_OCOMPAT
                else 'geometry' if (tag & 0xfff) == TAG_GEOMETRY
                else 'sizelimit' if (tag & 0xfff) == TAG_SIZELIMIT
                else 'namelimit' if (tag & 0xfff) == TAG_NAMELIMIT
                else 'config 0x%02x' % (tag & 0xff),
            ' w%d' % w if w else '',
            size)
    elif (tag & 0xef00) == TAG_GDELTA:
        return '%s%s%s %d' % (
            'shrub' if tag & TAG_SHRUB else '',
            'grmdelta' if (tag & 0xfff) == TAG_GRMDELTA
                else 'gdelta 0x%02x' % (tag & 0xff),
            ' w%d' % w if w else '',
            size)
    elif (tag & 0xef00) == TAG_NAME:
        return '%s%s%s %d' % (
            'shrub' if tag & TAG_SHRUB else '',
            'name' if (tag & 0xfff) == TAG_NAME
                else 'reg' if (tag & 0xfff) == TAG_REG
                else 'dir' if (tag & 0xfff) == TAG_DIR
                else 'orphan' if (tag & 0xfff) == TAG_ORPHAN
                else 'bookmark' if (tag & 0xfff) == TAG_BOOKMARK
                else 'name 0x%02x' % (tag & 0xff),
            ' w%d' % w if w else '',
            size)
    elif (tag & 0xef00) == TAG_STRUCT:
        return '%s%s%s %d' % (
            'shrub' if tag & TAG_SHRUB else '',
            'data' if (tag & 0xfff) == TAG_DATA
                else 'block' if (tag & 0xfff) == TAG_BLOCK
                else 'bshrub' if (tag & 0xfff) == TAG_BSHRUB
                else 'btree' if (tag & 0xfff) == TAG_BTREE
                else 'did' if (tag & 0xfff) == TAG_DID
                else 'becksum' if (tag & 0xfff) == TAG_BECKSUM
                else 'branch' if (tag & 0xfff) == TAG_BRANCH
                else 'mroot' if (tag & 0xfff) == TAG_MROOT
                else 'mdir' if (tag & 0xfff) == TAG_MDIR
                else 'mtree' if (tag & 0xfff) == TAG_MTREE
                else 'struct 0x%02x' % (tag & 0xff),
            ' w%d' % w if w else '',
            size)
    elif (tag & 0xef00) == TAG_UATTR:
        return '%suattr 0x%02x%s %d' % (
            'shrub' if tag & TAG_SHRUB else '',
            ((tag & 0x100) >> 1) | (tag & 0xff),
            ' w%d' % w if w else '',
            size)
    elif (tag & 0xef00) == TAG_SATTR:
        return '%ssattr 0x%02x%s %d' % (
            'shrub' if tag & TAG_SHRUB else '',
            ((tag & 0x100) >> 1) | (tag & 0xff),
            ' w%d' % w if w else '',
            size)
    elif (tag & 0xff00) == TAG_CKSUM:
        return 'cksum 0x%02x%s %d' % (
            tag & 0xff,
            ' w%d' % w if w > 0 else '',
            size)
    elif (tag & 0xff00) == TAG_ECKSUM:
        return 'ecksum%s%s %d' % (
            ' 0x%02x' % (tag & 0xff) if tag & 0xff else '',
            ' w%d' % w if w > 0 else '',
            size)
    elif tag & TAG_ALT:
        return 'alt%s%s%s w%d %s' % (
            'r' if tag & TAG_R else 'b',
            'a' if tag & 0x0fff == 0 and tag & TAG_GT
                else 'n' if tag & 0x0fff == 0
                else 'gt' if tag & TAG_GT
                else 'le',
            ' 0x%x' % (tag & 0x0fff) if tag & 0x0fff != 0 else '',
            w,
            '0x%x' % (0xffffffff & (off-size))
                if off is not None
                else '-%d' % off)
    else:
        return '0x%04x w%d %d' % (tag, w, size)


# this type is used for tree representations
TBranch = co.namedtuple('TBranch', 'a, b, d, c')

# our core rbyd type
class Rbyd:
    def __init__(self, block, data, rev, eoff, trunk, weight):
        self.block = block
        self.data = data
        self.rev = rev
        self.eoff = eoff
        self.trunk = trunk
        self.weight = weight
        self.redund_blocks = []

    def addr(self):
        if not self.redund_blocks:
            return '0x%x.%x' % (self.block, self.trunk)
        else:
            return '0x{%x,%s}.%x' % (
                self.block,
                ','.join('%x' % block for block in self.redund_blocks),
                self.trunk)

    @classmethod
    def fetch(cls, f, block_size, blocks, trunk=None):
        if isinstance(blocks, int):
            blocks = [blocks]

        if len(blocks) > 1:
            # fetch all blocks
            rbyds = [cls.fetch(f, block_size, block, trunk) for block in blocks]
            # determine most recent revision
            i = 0
            for i_, rbyd in enumerate(rbyds):
                # compare with sequence arithmetic
                if rbyd and (
                        not rbyds[i]
                        or not ((rbyd.rev - rbyds[i].rev) & 0x80000000)
                        or (rbyd.rev == rbyds[i].rev
                            and rbyd.trunk > rbyds[i].trunk)):
                    i = i_
            # keep track of the other blocks
            rbyd = rbyds[i]
            rbyd.redund_blocks = [rbyds[(i+1+j) % len(rbyds)].block
                for j in range(len(rbyds)-1)]
            return rbyd
        else:
            # block may encode a trunk
            block = blocks[0]
            if isinstance(block, tuple):
                if trunk is None:
                    trunk = block[1]
                block = block[0]

        # seek to the block
        f.seek(block * block_size)
        data = f.read(block_size)

        # fetch the rbyd
        rev = fromle32(data[0:4])
        cksum = 0
        cksum_ = crc32c(data[0:4])
        eoff = 0
        j_ = 4
        trunk_ = 0
        trunk__ = 0
        trunk___ = 0
        weight = 0
        weight_ = 0
        weight__ = 0
        wastrunk = False
        trunkeoff = None
        while j_ < len(data) and (not trunk or eoff <= trunk):
            v, tag, w, size, d = fromtag(data[j_:])
            if v != (popc(cksum_) & 1):
                break
            cksum_ = crc32c(data[j_:j_+d], cksum_)
            j_ += d
            if not tag & TAG_ALT and j_ + size > len(data):
                break

            # take care of cksums
            if not tag & TAG_ALT:
                if (tag & 0xff00) != TAG_CKSUM:
                    cksum_ = crc32c(data[j_:j_+size], cksum_)
                # found a cksum?
                else:
                    cksum__ = fromle32(data[j_:j_+4])
                    if cksum_ != cksum__:
                        break
                    # commit what we have
                    eoff = trunkeoff if trunkeoff else j_ + size
                    cksum = cksum_
                    trunk_ = trunk__
                    weight = weight_

            # evaluate trunks
            if (tag & 0xf000) != TAG_CKSUM and (
                    not trunk or trunk >= j_-d or wastrunk):
                # new trunk?
                if not wastrunk:
                    wastrunk = True
                    trunk___ = j_-d
                    weight__ = 0

                # keep track of weight
                weight__ += w

                # end of trunk?
                if not tag & TAG_ALT:
                    wastrunk = False
                    # update trunk/weight unless we found a shrub or an
                    # explicit trunk (which may be a shrub) is requested
                    if not tag & TAG_SHRUB or trunk:
                        trunk__ = trunk___
                        weight_ = weight__
                        # keep track of eoff for best matching trunk
                        if trunk and j_ + size > trunk:
                            trunkeoff = j_ + size
                            eoff = trunkeoff
                            cksum = cksum_
                            trunk_ = trunk__
                            weight = weight_

            if not tag & TAG_ALT:
                j_ += size

        return cls(block, data, rev, eoff, trunk_, weight)

    def lookup(self, rid, tag):
        if not self:
            return True, 0, -1, 0, 0, 0, b'', []

        tag = max(tag, 0x1)
        lower = 0
        upper = self.weight
        path = []

        # descend down tree
        j = self.trunk
        while True:
            _, alt, weight_, jump, d = fromtag(self.data[j:])

            # found an alt?
            if alt & TAG_ALT:
                # follow?
                if ((rid, tag & 0xfff) > (upper-weight_-1, alt & 0xfff)
                        if alt & TAG_GT
                        else ((rid, tag & 0xfff)
                            <= (lower+weight_-1, alt & 0xfff))):
                    lower += upper-lower-weight_ if alt & TAG_GT else 0
                    upper -= upper-lower-weight_ if not alt & TAG_GT else 0
                    j = j - jump

                    # figure out which color
                    if alt & TAG_R:
                        _, nalt, _, _, _ = fromtag(self.data[j+jump+d:])
                        if nalt & TAG_R:
                            path.append((j+jump, j, True, 'y'))
                        else:
                            path.append((j+jump, j, True, 'r'))
                    else:
                        path.append((j+jump, j, True, 'b'))

                # stay on path
                else:
                    lower += weight_ if not alt & TAG_GT else 0
                    upper -= weight_ if alt & TAG_GT else 0
                    j = j + d

                    # figure out which color
                    if alt & TAG_R:
                        _, nalt, _, _, _ = fromtag(self.data[j:])
                        if nalt & TAG_R:
                            path.append((j-d, j, False, 'y'))
                        else:
                            path.append((j-d, j, False, 'r'))
                    else:
                        path.append((j-d, j, False, 'b'))

            # found tag
            else:
                rid_ = upper-1
                tag_ = alt
                w_ = upper-lower

                done = not tag_ or (rid_, tag_) < (rid, tag)

                return done, rid_, tag_, w_, j, d, self.data[j+d:j+d+jump], path

    def __bool__(self):
        return bool(self.trunk)

    def __eq__(self, other):
        return self.block == other.block and self.trunk == other.trunk

    def __ne__(self, other):
        return not self.__eq__(other)

    def __iter__(self):
        tag = 0
        rid = -1

        while True:
            done, rid, tag, w, j, d, data, _ = self.lookup(rid, tag+0x1)
            if done:
                break

            yield rid, tag, w, j, d, data

    # create tree representation for debugging
    def tree(self):
        trunks = co.defaultdict(lambda: (-1, 0))
        alts = co.defaultdict(lambda: {})

        rid, tag = -1, 0
        while True:
            done, rid, tag, w, j, d, data, path = self.lookup(rid, tag+0x1)
            # found end of tree?
            if done:
                break

            # keep track of trunks/alts
            trunks[j] = (rid, tag)

            for j_, j__, followed, c in path:
                if followed:
                    alts[j_] |= {'f': j__, 'c': c}
                else:
                    alts[j_] |= {'nf': j__, 'c': c}

        # treat unreachable alts as converging paths
        for j_, alt in alts.items():
            if 'f' not in alt:
                alt['f'] = alt['nf']
            elif 'nf' not in alt:
                alt['nf'] = alt['f']

        # find the trunk and depth of each alt
        def rec_trunk(j_):
            if j_ not in alts:
                return trunks[j_]
            else:
                if 'nft' not in alts[j_]:
                    alts[j_]['nft'] = rec_trunk(alts[j_]['nf'])
                return alts[j_]['nft']

        for j_ in alts.keys():
            rec_trunk(j_)
        for j_, alt in alts.items():
            if alt['f'] in alts:
                alt['ft'] = alts[alt['f']]['nft']
            else:
                alt['ft'] = trunks[alt['f']]

        def rec_height(j_):
            if j_ not in alts:
                return 0
            else:
                if 'h' not in alts[j_]:
                    alts[j_]['h'] = max(
                        rec_height(alts[j_]['f']),
                        rec_height(alts[j_]['nf'])) + 1
                return alts[j_]['h']

        for j_ in alts.keys():
            rec_height(j_)

        t_depth = max((alt['h']+1 for alt in alts.values()), default=0)

        # convert to more general tree representation
        tree = set()
        for j, alt in alts.items():
            # note all non-trunk edges should be black
            tree.add(TBranch(
                a=alt['nft'],
                b=alt['nft'],
                d=t_depth-1 - alt['h'],
                c=alt['c'],
            ))
            tree.add(TBranch(
                a=alt['nft'],
                b=alt['ft'],
                d=t_depth-1 - alt['h'],
                c='b',
            ))

        return tree, t_depth

    # btree lookup with this rbyd as the root
    def btree_lookup(self, f, block_size, bid, *,
            depth=None):
        rbyd = self
        rid = bid
        depth_ = 1
        path = []

        # corrupted? return a corrupted block once
        if not rbyd:
            return bid > 0, bid, 0, rbyd, -1, [], path

        while True:
            # collect all tags, normally you don't need to do this
            # but we are debugging here
            name = None
            tags = []
            branch = None
            rid_ = rid
            tag = 0
            w = 0
            for i in it.count():
                done, rid__, tag, w_, j, d, data, _ = rbyd.lookup(
                    rid_, tag+0x1)
                if done or (i != 0 and rid__ != rid_):
                    break

                # first tag indicates the branch's weight
                if i == 0:
                    rid_, w = rid__, w_

                # catch any branches
                if tag & 0xfff == TAG_BRANCH:
                    branch = (tag, j, d, data)

                tags.append((tag, j, d, data))

            # keep track of path
            path.append((bid + (rid_-rid), w, rbyd, rid_, tags))

            # descend down branch?
            if branch is not None and (
                    not depth or depth_ < depth):
                tag, j, d, data = branch
                block, trunk, cksum = frombranch(data)
                rbyd = Rbyd.fetch(f, block_size, block, trunk)

                # corrupted? bail here so we can keep traversing the tree
                if not rbyd:
                    return False, bid + (rid_-rid), w, rbyd, -1, [], path

                rid -= (rid_-(w-1))
                depth_ += 1
            else:
                return not tags, bid + (rid_-rid), w, rbyd, rid_, tags, path

    # btree rbyd-tree generation for debugging
    def btree_tree(self, f, block_size, *,
            depth=None,
            inner=False):
        # find the max depth of each layer to nicely align trees
        bdepths = {}
        bid = -1
        while True:
            done, bid, w, rbyd, rid, tags, path = self.btree_lookup(
                f, block_size, bid+1, depth=depth)
            if done:
                break

            for d, (bid, w, rbyd, rid, tags) in enumerate(path):
                _, rdepth = rbyd.tree()
                bdepths[d] = max(bdepths.get(d, 0), rdepth)

        # find all branches
        tree = set()
        root = None
        branches = {}
        bid = -1
        while True:
            done, bid, w, rbyd, rid, tags, path = self.btree_lookup(
                f, block_size, bid+1, depth=depth)
            if done:
                break

            d_ = 0
            leaf = None
            for d, (bid, w, rbyd, rid, tags) in enumerate(path):
                if not tags:
                    continue

                # map rbyd tree into B-tree space
                rtree, rdepth = rbyd.tree()

                # note we adjust our bid/rids to be left-leaning,
                # this allows a global order and make tree rendering quite
                # a bit easier
                rtree_ = set()
                for branch in rtree:
                    a_rid, a_tag = branch.a
                    b_rid, b_tag = branch.b
                    _, _, _, a_w, _, _, _, _ = rbyd.lookup(a_rid, 0)
                    _, _, _, b_w, _, _, _, _ = rbyd.lookup(b_rid, 0)
                    rtree_.add(TBranch(
                        a=(a_rid-(a_w-1), a_tag),
                        b=(b_rid-(b_w-1), b_tag),
                        d=branch.d,
                        c=branch.c,
                    ))
                rtree = rtree_

                # connect our branch to the rbyd's root
                if leaf is not None:
                    root = min(rtree,
                        key=lambda branch: branch.d,
                        default=None)

                    if root is not None:
                        r_rid, r_tag = root.a
                    else:
                        r_rid, r_tag = rid-(w-1), tags[0][0]
                    tree.add(TBranch(
                        a=leaf,
                        b=(bid-rid+r_rid, d, r_rid, r_tag),
                        d=d_-1,
                        c='b',
                    ))

                for branch in rtree:
                    # map rbyd branches into our btree space
                    a_rid, a_tag = branch.a
                    b_rid, b_tag = branch.b
                    tree.add(TBranch(
                        a=(bid-rid+a_rid, d, a_rid, a_tag),
                        b=(bid-rid+b_rid, d, b_rid, b_tag),
                        d=branch.d + d_ + bdepths.get(d, 0)-rdepth,
                        c=branch.c,
                    ))

                d_ += max(bdepths.get(d, 0), 1)
                leaf = (bid-(w-1), d, rid-(w-1),
                    next((tag for tag, _, _, _ in tags
                            if tag & 0xfff == TAG_BRANCH),
                        TAG_BRANCH))

        # remap branches to leaves if we aren't showing inner branches
        if not inner:
            # step through each layer backwards
            b_depth = max((branch.a[1]+1 for branch in tree), default=0)

            # keep track of the original bids, unfortunately because we
            # store the bids in the branches we overwrite these
            tree = {(branch.b[0] - branch.b[2], branch) for branch in tree}

            for bd in reversed(range(b_depth-1)):
                # find leaf-roots at this level
                roots = {}
                for bid, branch in tree:
                    # choose the highest node as the root
                    if (branch.b[1] == b_depth-1
                            and (bid not in roots
                                or branch.d < roots[bid].d)):
                        roots[bid] = branch

                # remap branches to leaf-roots
                tree_ = set()
                for bid, branch in tree:
                    if branch.a[1] == bd and branch.a[0] in roots:
                        branch = TBranch(
                            a=roots[branch.a[0]].b,
                            b=branch.b,
                            d=branch.d,
                            c=branch.c,
                        )
                    if branch.b[1] == bd and branch.b[0] in roots:
                        branch = TBranch(
                            a=branch.a,
                            b=roots[branch.b[0]].b,
                            d=branch.d,
                            c=branch.c,
                        )
                    tree_.add((bid, branch))
                tree = tree_

            # strip out bids
            tree = {branch for _, branch in tree}

        return tree, max((branch.d+1 for branch in tree), default=0)

    # btree B-tree generation for debugging
    def btree_btree(self, f, block_size, *,
            depth=None,
            inner=False):
        # find all branches
        tree = set()
        root = None
        branches = {}
        bid = -1
        while True:
            done, bid, w, rbyd, rid, tags, path = self.btree_lookup(
                f, block_size, bid+1, depth=depth)
            if done:
                break

            # if we're not showing inner nodes, prefer names higher in
            # the tree since this avoids showing vestigial names
            name = None
            if not inner:
                name = None
                for bid_, w_, rbyd_, rid_, tags_ in reversed(path):
                    for tag_, j_, d_, data_ in tags_:
                        if tag_ & 0x7f00 == TAG_NAME:
                            name = (tag_, j_, d_, data_)

                    if rid_-(w_-1) != 0:
                        break

            a = root
            for d, (bid, w, rbyd, rid, tags) in enumerate(path):
                if not tags:
                    continue

                b = (bid-(w-1), d, rid-(w-1),
                    (name if name else tags[0])[0])

                # remap branches to leaves if we aren't showing
                # inner branches
                if not inner:
                    if b not in branches:
                        bid, w, rbyd, rid, tags = path[-1]
                        if not tags:
                            continue
                        branches[b] = (
                            bid-(w-1), len(path)-1, rid-(w-1),
                            (name if name else tags[0])[0])
                    b = branches[b]

                # found entry point?
                if root is None:
                    root = b
                    a = root

                tree.add(TBranch(
                    a=a,
                    b=b,
                    d=d,
                    c='b',
                ))
                a = b

        return tree, max((branch.d+1 for branch in tree), default=0)

    # mtree lookup with this rbyd as the mroot
    def mtree_lookup(self, f, block_size, mbid):
        # have mtree?
        done, rid, tag, w, j, d, data, _ = self.lookup(-1, TAG_MTREE)
        if not done and rid == -1 and tag == TAG_MTREE:
            w, block, trunk, cksum = frombtree(data)
            mtree = Rbyd.fetch(f, block_size, block, trunk)
            # corrupted?
            if not mtree:
                return True, -1, 0, None

            # lookup our mbid
            done, mbid, mw, rbyd, rid, tags, path = mtree.btree_lookup(
                f, block_size, mbid)
            if done:
                return True, -1, 0, None

            mdir = next(((tag, j, d, data)
                for tag, j, d, data in tags
                if tag == TAG_MDIR),
                None)
            if not mdir:
                return True, -1, 0, None

            # fetch the mdir
            _, _, _, data = mdir
            blocks = frommdir(data)
            return False, mbid, mw, Rbyd.fetch(f, block_size, blocks)

        else:
            # have mdir?
            done, rid, tag, w, j, _, data, _ = self.lookup(-1, TAG_MDIR)
            if not done and rid == -1 and tag == TAG_MDIR:
                blocks = frommdir(data)
                return False, 0, 0, Rbyd.fetch(f, block_size, blocks)

            else:
                # I guess we're inlined?
                if mbid == -1:
                    return False, -1, 0, self
                else:
                    return True, -1, 0, None

    # lookup by name
    def namelookup(self, did, name):
        # binary search
        best = (False, -1, 0, 0)
        lower = 0
        upper = self.weight
        while lower < upper:
            done, rid, tag, w, j, d, data, _ = self.lookup(
                lower + (upper-1-lower)//2, TAG_NAME)
            if done:
                break

            # treat vestigial names as a catch-all
            if ((tag == TAG_NAME and rid-(w-1) == 0)
                    or (tag & 0xff00) != TAG_NAME):
                did_ = 0
                name_ = b''
            else:
                did_, d = fromleb128(data)
                name_ = data[d:]

            # bisect search space
            if (did_, name_) > (did, name):
                upper = rid-(w-1)
            elif (did_, name_) < (did, name):
                lower = rid + 1

                # keep track of best match
                best = (False, rid, tag, w)
            else:
                # found a match
                return True, rid, tag, w

        return best

    # lookup by name with this rbyd as the btree root
    def btree_namelookup(self, f, block_size, did, name):
        rbyd = self
        bid = 0

        while True:
            found, rid, tag, w = rbyd.namelookup(did, name)
            done, rid_, tag_, w_, j, d, data, _ = rbyd.lookup(rid, TAG_STRUCT)

            # found another branch
            if tag_ & 0xfff == TAG_BRANCH:
                # update our bid
                bid += rid - (w-1)

                block, trunk, cksum = frombranch(data)
                rbyd = Rbyd.fetch(f, block_size, block, trunk)

            # found best match
            else:
                return bid + rid, tag_, w, data

    # lookup by name with this rbyd as the mroot
    def mtree_namelookup(self, f, block_size, did, name):
        # have mtree?
        done, rid, tag, w, j, d, data, _ = self.lookup(-1, TAG_MTREE)
        if not done and rid == -1 and tag == TAG_MTREE:
            w, block, trunk, cksum = frombtree(data)
            mtree = Rbyd.fetch(f, block_size, block, trunk)
            # corrupted?
            if not mtree:
                return False, -1, 0, None, -1, 0, 0

            # lookup our name in the mtree
            mbid, tag_, mw, data = mtree.btree_namelookup(
                f, block_size, did, name)
            if tag_ != TAG_MDIR:
                return False, -1, 0, None, -1, 0, 0

            # fetch the mdir
            blocks = frommdir(data)
            mdir = Rbyd.fetch(f, block_size, blocks)

        else:
            # have mdir?
            done, rid, tag, w, j, _, data, _ = self.lookup(-1, TAG_MDIR)
            if not done and rid == -1 and tag == TAG_MDIR:
                blocks = frommdir(data)
                mbid = 0
                mw = 0
                mdir = Rbyd.fetch(f, block_size, blocks)

            else:
                # I guess we're inlined?
                mbid = -1
                mw = 0
                mdir = self

        # lookup name in our mdir
        found, rid, tag, w = mdir.namelookup(did, name)
        return found, mbid, mw, mdir, rid, tag, w

    # iterate through a directory assuming this is the mtree root
    def mtree_dir(self, f, block_size, did):
        # lookup the bookmark
        found, mbid, mw, mdir, rid, tag, w = self.mtree_namelookup(
            f, block_size, did, b'')
        # iterate through all files until the next bookmark
        while found:
            # lookup each rid
            done, rid, tag, w, j, d, data, _ = mdir.lookup(rid, TAG_NAME)
            if done:
                break

            # parse out each name
            did_, d_ = fromleb128(data)
            name_ = data[d_:]

            # end if we see another did
            if did_ != did:
                break

            # yield what we've found
            yield name_, mbid, mw, mdir, rid, tag, w

            rid += w
            if rid >= mdir.weight:
                rid -= mdir.weight
                mbid += 1

                done, mbid, mw, mdir = self.mtree_lookup(f, block_size, mbid)
                if done:
                    break


# read the config
class Config:
    def __init__(self, mroot=None):
        # read the config from the mroot
        self.config = {}
        if mroot is not None:
            tag = 0
            while True:
                done, rid, tag, w, j, d, data, _ = mroot.lookup(-1, tag+0x1)
                if done or rid != -1 or (tag & 0xff00) != TAG_CONFIG:
                    break

                self.config[tag] = (j+d, data)

    # accessors for known config
    @ft.cached_property
    def magic(self):
        if TAG_MAGIC in self.config:
            _, data = self.config[TAG_MAGIC]
            return data
        else:
            return None

    @ft.cached_property
    def version(self):
        if TAG_VERSION in self.config:
            _, data = self.config[TAG_VERSION]
            d = 0
            major, d_ = fromleb128(data[d:]); d += d_
            minor, d_ = fromleb128(data[d:]); d += d_
            return (major, minor)
        else:
            return (None, None)

    @ft.cached_property
    def rcompat(self):
        if TAG_RCOMPAT in self.config:
            _, data = self.config[TAG_RCOMPAT]
            return data
        else:
            return None

    @ft.cached_property
    def wcompat(self):
        if TAG_WCOMPAT in self.config:
            _, data = self.config[TAG_WCOMPAT]
            return data
        else:
            return None

    @ft.cached_property
    def ocompat(self):
        if TAG_OCOMPAT in self.config:
            _, data = self.config[TAG_OCOMPAT]
            return data
        else:
            return None

    @ft.cached_property
    def geometry(self):
        if TAG_GEOMETRY in self.config:
            _, data = self.config[TAG_GEOMETRY]
            d = 0
            block_size, d_ = fromleb128(data[d:]); d += d_
            block_count, d_ = fromleb128(data[d:]); d += d_
            return (block_size+1, block_count+1)
        else:
            return (None, None)

    @ft.cached_property
    def name_limit(self):
        if TAG_NAMELIMIT in self.config:
            _, data = self.config[TAG_NAMELIMIT]
            name_limit, _ = fromleb128(data)
            return name_limit
        else:
            return None

    @ft.cached_property
    def size_limit(self):
        if TAG_SIZELIMIT in self.config:
            _, data = self.config[TAG_SIZELIMIT]
            size_limit, _ = fromleb128(data)
            return size_limit
        else:
            return None

    def repr(self):
        def crepr(tag, data):
            if tag == TAG_MAGIC:
                return 'magic \"%s\"' % ''.join(
                    b if b >= ' ' and b <= '~' else '.'
                    for b in map(chr, self.magic))
            elif tag == TAG_VERSION:
                return 'version v%d.%d' % self.version
            elif tag == TAG_RCOMPAT:
                return 'rcompat 0x%s' % ''.join(
                    '%x' % f for f in reversed(self.rcompat))
            elif tag == TAG_WCOMPAT:
                return 'wcompat 0x%s' % ''.join(
                    '%x' % f for f in reversed(self.wcompat))
            elif tag == TAG_OCOMPAT:
                return 'ocompat 0x%s' % ''.join(
                    '%x' % f for f in reversed(self.ocompat))
            elif tag == TAG_GEOMETRY:
                return 'geometry %dx%d' % self.geometry
            elif tag == TAG_SIZELIMIT:
                return 'sizelimit %d' % self.size_limit
            elif tag == TAG_NAMELIMIT:
                return 'namelimit %d' % self.name_limit
            else:
                return 'config 0x%02x %d' % (tag, len(data))

        for tag, (j, data) in sorted(self.config.items()):
            yield crepr(tag, data), tag, j, data


# collect gstate
class GState:
    def __init__(self, mleaf_weight):
        self.gstate = {}
        self.gdelta = {}
        self.mleaf_weight = mleaf_weight

    def xor(self, mbid, mw, mdir):
        tag = TAG_GDELTA-0x1
        while True:
            done, rid, tag, w, j, d, data, _ = mdir.lookup(-1, tag+0x1)
            if done or rid != -1 or (tag & 0xff00) != TAG_GDELTA:
                break

            # keep track of gdeltas
            if tag not in self.gdelta:
                self.gdelta[tag] = []
            self.gdelta[tag].append((mbid, mw, mdir, j, d, data))

            # xor gstate
            if tag not in self.gstate:
                self.gstate[tag] = b''
            self.gstate[tag] = bytes(a^b for a,b in it.zip_longest(
                self.gstate[tag], data, fillvalue=0))

    # parsers for some gstate
    @ft.cached_property
    def grm(self):
        if TAG_GRMDELTA not in self.gstate:
            return []

        data = self.gstate[TAG_GRMDELTA]
        d = 0
        count,  d_ = fromleb128(data[d:]); d += d_
        rms = []
        if count <= 2:
            for _ in range(count):
                mid, d_ = fromleb128(data[d:]); d += d_
                rms.append((
                    mid - (mid % self.mleaf_weight),
                    mid % self.mleaf_weight))
        return rms

    def repr(self):
        def grepr(tag, data):
            if tag == TAG_GRMDELTA:
                count, _ = fromleb128(data)
                return 'grm %s' % (
                    'none' if count == 0
                        else ' '.join('%d.%d' % (mbid//self.mleaf_weight, rid)
                                for mbid, rid in self.grm)
                            if count <= 2
                        else '0x%x %d' % (count, len(data)))
            else:
                return 'gstate 0x%02x %d' % (tag, len(data))

        for tag, data in sorted(self.gstate.items()):
            yield grepr(tag, data), tag, data

def frepr(mdir, rid, tag):
    if tag == TAG_REG or tag == TAG_ORPHAN:
        size = 0
        structs = []
        # inlined data?
        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(rid, TAG_DATA)
        if not done and rid_ == rid and tag_ == TAG_DATA:
            size = max(size, len(data))
            structs.append('data 0x%x.%x' % (mdir.block, j+d))
        # direct block?
        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(rid, TAG_BLOCK)
        if not done and rid_ == rid and tag_ == TAG_BLOCK:
            size_, block, off, cksize, cksum = frombptr(data)
            size = max(size, size_)
            structs.append('block 0x%x.%x' % (block, off))
        # inlined bshrub?
        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(rid, TAG_BSHRUB)
        if not done and rid_ == rid and tag_ == TAG_BSHRUB:
            weight, trunk = fromshrub(data)
            size = max(size, weight)
            structs.append('bshrub 0x%x.%x' % (mdir.block, trunk))
        # indirect btree?
        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(rid, TAG_BTREE)
        if not done and rid_ == rid and tag_ == TAG_BTREE:
            weight, block, trunk, cksum = frombtree(data)
            size = max(size, weight)
            structs.append('btree 0x%x.%x' % (block, trunk))
        return '%s %s' % (
            'orphan' if tag == TAG_ORPHAN else 'reg',
            ', '.join(it.chain(['%d' % size], structs)))

    elif tag == TAG_DIR:
        # read the did
        did = '?'
        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(rid, TAG_DID)
        if not done and rid_ == rid and tag_ == TAG_DID:
            did, _ = fromleb128(data)
            did = '0x%x' % did
        return 'dir %s' % did

    elif tag == TAG_BOOKMARK:
        # read the did
        did = '?'
        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(rid, tag)
        if not done and rid_ == rid and tag_ == tag:
            did, _ = fromleb128(data)
            did = '0x%x' % did
        return 'bookmark %s' % did

    else:
        return 'type 0x%02x' % (tag & 0xff)

def dbg_fstruct(f, block_size, mdir, rid, tag, j, d, data, *,
        m_width=0,
        color=False,
        args={}):
    # first decode possible rbyds/btrees, for sprouts/direct blocks we pretend
    # the entry itself is a single-element btree

    # inlined data?
    if tag == TAG_DATA:
        btree = Rbyd(
            mdir.block,
            mdir.data,
            mdir.rev,
            mdir.eoff,
            j,
            0)
        w = len(data)
    # direct block?
    elif tag == TAG_BLOCK:
        btree = Rbyd(
            mdir.block,
            mdir.data,
            mdir.rev,
            mdir.eoff,
            j,
            0)
        size, block, off, cksize, cksum = frombptr(data)
        w = size
    # inlined bshrub?
    elif tag == TAG_BSHRUB:
        weight, trunk = fromshrub(data)
        btree = Rbyd.fetch(f, block_size, mdir.block, trunk)
        w = weight
    # indirect btree?
    elif tag == TAG_BTREE:
        weight, block, trunk, cksum = frombtree(data)
        btree = Rbyd.fetch(f, block_size, block, trunk)
        w = weight

    # precompute rbyd-trees if requested
    t_width = 0
    if args.get('tree'):
        tree, tdepth = btree.btree_tree(
            f, block_size,
            depth=args.get('struct_depth'),
            inner=args.get('inner'))

    # precompute B-trees if requested
    elif args.get('btree'):
        tree, tdepth = btree.btree_btree(
            f, block_size,
            depth=args.get('struct_depth'),
            inner=args.get('inner'))

    if args.get('tree') or args.get('btree'):
        # map the tree into our block space
        tree_ = set()
        for branch in tree:
            a_bid, a_bd, a_rid, a_tag = branch.a
            b_bid, b_bd, b_rid, b_tag = branch.b
            # flatten non-data tags if we're not showing inner nodes
            if not args.get('inner'):
                if ((a_tag & 0xfff) != TAG_DATA
                        and (a_tag & 0xfff) != TAG_BLOCK):
                    a_tag = (a_tag & 0xf000) | TAG_BLOCK
                if ((b_tag & 0xfff) != TAG_DATA
                        and (b_tag & 0xfff) != TAG_BLOCK):
                    b_tag = (b_tag & 0xf000) | TAG_BLOCK
            tree_.add(TBranch(
                a=(a_bid, a_bd, a_rid, (a_tag & 0xfff) == TAG_BLOCK, a_tag),
                b=(b_bid, b_bd, b_rid, (b_tag & 0xfff) == TAG_BLOCK, b_tag),
                d=branch.d + (1 if args.get('inner') else 0),
                c=branch.c,
            ))
        tree = tree_

        # connect our source tag if we are showing inner nodes
        if ((tag & 0xfff) != TAG_DATA
                and (tag & 0xfff) != TAG_BLOCK
                and args.get('inner')):
            if tree:
                branch = min(tree, key=lambda branch: branch.d)
                a_bid, a_bd, a_rid, a_block, a_tag = branch.a
                tree.add(TBranch(
                    a=(0, -1, 0, False, tag),
                    b=(a_bid, a_bd, a_rid, a_block, a_tag),
                    d=0,
                    c='b'
                ))
            else:
                done, rid_, tag_, w_, j_, d_, data_, _ = btree.lookup(-1, 0)
                if not done:
                    tree.add(TBranch(
                        a=(0, -1, 0, False, tag),
                        b=(rid_-(w_-1), 0, rid_-(w_-1), False, tag_),
                        d=0,
                        c='b'
                    ))

        # we need to do some patching if our tree contains blocks and we're
        # showing inner nodes
        if args.get('inner') and any(branch.b[-1] for branch in tree):
            # find the max depth for each leaf
            bds = {}
            for branch in tree:
                a_bid, a_bd, a_rid, a_block, a_tag = branch.a
                b_bid, b_bd, b_rid, b_block, b_tag = branch.b
                if b_block:
                    bds[branch.b] = max(branch.d, bds.get(branch.b, -1))

            # add branch from block tag to the actual block
            tree_ = set()
            for branch in tree:
                a_bid, a_bd, a_rid, a_block, a_tag = branch.a
                b_bid, b_bd, b_rid, b_block, b_tag = branch.b
                tree_.add(TBranch(
                    a=(a_bid, a_bd, a_rid, False, a_tag),
                    b=(b_bid, b_bd, b_rid, False, b_tag),
                    d=branch.d,
                    c=branch.c,
                ))

                if b_block and branch.d == bds.get(branch.b, -1):
                    tree_.add(TBranch(
                        a=(b_bid, b_bd, b_rid, False, b_tag),
                        b=(b_bid, b_bd, b_rid, True,  b_tag),
                        d=branch.d + 1,
                        c=branch.c,
                    ))
            tree = tree_

    # common tree renderer
    if args.get('tree') or args.get('btree'):
        # find the max depth from the tree
        t_depth = max((branch.d+1 for branch in tree), default=0)
        if t_depth > 0:
            t_width = 2*t_depth + 2

        def treerepr(bid, w, bd, rid, block, tag):
            if t_depth == 0:
                return ''

            def branchrepr(x, d, was):
                for branch in tree:
                    if branch.d == d and branch.b == x:
                        if any(branch.d == d and branch.a == x
                                for branch in tree):
                            return '+-', branch.c, branch.c
                        elif any(branch.d == d
                                and x > min(branch.a, branch.b)
                                and x < max(branch.a, branch.b)
                                for branch in tree):
                            return '|-', branch.c, branch.c
                        elif branch.a < branch.b:
                            return '\'-', branch.c, branch.c
                        else:
                            return '.-', branch.c, branch.c
                for branch in tree:
                    if branch.d == d and branch.a == x:
                        return '+ ', branch.c, None
                for branch in tree:
                    if (branch.d == d
                            and x > min(branch.a, branch.b)
                            and x < max(branch.a, branch.b)):
                        return '| ', branch.c, was
                if was:
                    return '--', was, was
                return '  ', None, None

            trunk = []
            was = None
            for d in range(t_depth):
                t, c, was = branchrepr(
                    (bid-(w-1), bd, rid-(w-1), block, tag), d, was)

                trunk.append('%s%s%s%s' % (
                    '\x1b[33m' if color and c == 'y'
                        else '\x1b[31m' if color and c == 'r'
                        else '\x1b[90m' if color and c == 'b'
                        else '',
                    t,
                    ('>' if was else ' ') if d == t_depth-1 else '',
                    '\x1b[m' if color and c else ''))

            return '%s ' % ''.join(trunk)


    # dynamically size the id field
    w_width = m.ceil(m.log10(max(1, btree.weight)+1))

    # prbyd here means the last rendered rbyd, we update
    # in dbg_branch to always print interleaved addresses
    prbyd = None
    def dbg_branch(bid, w, rbyd, rid, tags, bd):
        nonlocal prbyd

        # show human-readable representation
        for i, (tag, j, d, data) in enumerate(tags):
            print('%12s %*s %s%s%-*s  %s' % (
                '%04x.%04x:' % (rbyd.block, rbyd.trunk)
                    if prbyd is None or rbyd != prbyd
                    else '',
                m_width, '',
                treerepr(bid, w, bd, rid, False, tag)
                    if args.get('tree') or args.get('btree') else '',
                '%*s ' % (2*w_width+1, '' if i != 0
                    else '%d-%d' % (bid-(w-1), bid) if w > 1
                    else bid if w > 0
                    else ''),
                21+2*w_width+1,
                    tagrepr(tag, w if i == 0 else 0, len(data), None),
                next(xxd(data, 8), '')
                    if not args.get('raw') and not args.get('no_truncate')
                    else ''))
            prbyd = rbyd

            # show in-device representation
            if args.get('device'):
                print('%11s  %*s %*s%s%04x %08x %07x' % (
                    '',
                    m_width, '',
                    t_width, '',
                    '%*s ' % (2*w_width+1, ''),
                    tag, w if i == 0 else 0, len(data)))

            # show on-disk encoding of tags/data
            if args.get('raw'):
                for o, line in enumerate(xxd(rbyd.data[j:j+d])):
                    print('%11s: %*s %*s%s%s' % (
                        '%04x' % (j + o*16),
                        m_width, '',
                        t_width, '',
                        '%*s ' % (2*w_width+1, ''),
                        line))
            if args.get('raw') or args.get('no_truncate'):
                for o, line in enumerate(xxd(data)):
                    print('%11s: %*s %*s%s%s' % (
                        '%04x' % (j+d + o*16),
                        m_width, '',
                        t_width, '',
                        '%*s ' % (2*w_width+1, ''),
                        line))

    def dbg_block(bid, w, rbyd, rid, bptr,
            block, off, size, cksize, cksum, data, notes,
            bd):
        nonlocal prbyd
        tag, _, _, _ = bptr

        # show human-readable representation
        print('%s%12s%s %*s %s%s%s%-*s%s%s' % (
            '\x1b[31m' if color and notes else '',
            '%04x.%04x:' % (rbyd.block, rbyd.trunk)
                if prbyd is None or rbyd != prbyd
                else '',
            '\x1b[0m' if color and notes else '',
            m_width, '',
            treerepr(bid, w, bd, rid, True, tag)
                if args.get('tree') or args.get('btree') else '',
            '\x1b[31m' if color and notes else '',
            '%*s ' % (2*w_width+1, '%d-%d' % (bid-(w-1), bid) if w > 1
                else bid if w > 0
                else ''),
            56+2*w_width+1, '%-*s  %s' % (
                21+2*w_width+1, '%s%s%s 0x%x.%x %d' % (
                    'shrub' if tag & TAG_SHRUB else '',
                    'block',
                    ' w%d' % w if w else '',
                    block, off, size),
                next(xxd(data, 8), '')
                    if not args.get('raw') and not args.get('no_truncate')
                    else ''),
            ' (%s)' % ', '.join(notes) if notes else '',
            '\x1b[m' if color and notes else ''))
        prbyd = rbyd

        # show in-device representation
        if args.get('device'):
            _, j, d, data_ = bptr
            print('%11s  %*s %*s%s%04x %08x %07x' % (
                '',
                m_width, '',
                t_width, '',
                '%*s ' % (2*w_width+1, ''),
                tag, w, len(data_)))

        # show on-disk encoding of tags/bptr/data
        if args.get('raw'):
            _, j, d, data_ = bptr
            for o, line in enumerate(xxd(rbyd.data[j:j+d])):
                print('%11s: %*s %*s%s%s' % (
                    '%04x' % (j + o*16),
                    m_width, '',
                    t_width, '',
                    '%*s ' % (2*w_width+1, ''),
                    line))
        if args.get('raw'):
            _, j, d, data_ = bptr
            for o, line in enumerate(xxd(data_)):
                print('%11s: %*s %*s%s%s' % (
                    '%04x' % (j+d + o*16),
                    m_width, '',
                    t_width, '',
                    '%*s ' % (2*w_width+1, ''),
                    line))
        if args.get('raw') or args.get('no_truncate'):
            for o, line in enumerate(xxd(data)):
                print('%11s: %*s %*s%s%s' % (
                    '%04x.%04x' % (block, off + o*16)
                        if o == 0 and block != prbyd.block
                        else '%04x' % (off + o*16),
                    m_width, '',
                    t_width, '',
                    '%*s ' % (2*w_width+1, ''),
                    line))
            # if we show non-truncated file contents we need to
            # reset the rbyd address
            if block != prbyd.block:
                prbyd = None

    # show our source tag? note the big hack here of pretending our
    # entry is a single-element btree
    if tag == TAG_DATA or tag == TAG_BLOCK or args.get('inner'):
        dbg_branch(w-1, w, Rbyd(
            mdir.block,
            mdir.data,
            mdir.rev,
            mdir.eoff,
            j,
            0), w-1, [(tag, j, d, data)], -1)

    # traverse and print entries
    bid = -1
    prbyd = None
    ppath = []
    corrupted = False
    while True:
        done, bid, w, rbyd, rid, tags, path = btree.btree_lookup(
            f, block_size, bid+1, depth=args.get('struct_depth'))
        if done:
            break

        # print inner rbyd entries if requested
        if args.get('inner'):
            changed = False
            for (x, px) in it.zip_longest(
                    enumerate(path[:-1]),
                    enumerate(ppath[:-1])):
                if x is None:
                    break
                if not (changed or px is None or x != px):
                    continue
                changed = True

                # show the inner entry
                d, (bid_, w_, rbyd_, rid_, tags_) = x
                dbg_branch(bid_, w_, rbyd_, rid_, tags_, d)
        ppath = path

        # corrupted? try to keep printing the tree
        if not rbyd:
            print('  %04x.%04x: %*s %*s%s%s%s' % (
                rbyd.block, rbyd.trunk,
                m_width, '',
                t_width, '',
                '\x1b[31m' if color else '',
                '(corrupted rbyd %s)' % rbyd.addr(),
                '\x1b[m' if color else ''))
            prbyd = rbyd
            corrupted = True
            continue

        # if we're not showing inner nodes, prefer names higher in the tree
        # since this avoids showing vestigial names
        if not args.get('inner'):
            name = None
            for bid_, w_, rbyd_, rid_, tags_ in reversed(path):
                for tag_, j_, d_, data_ in tags_:
                    if tag_ & 0x7f00 == TAG_NAME:
                        name = (tag_, j_, d_, data_)

                if rid_-(w_-1) != 0:
                    break

            if name is not None:
                tags = [name] + [(tag, j, d, data)
                    for tag, j, d, data in tags
                    if tag & 0x7f00 != TAG_NAME]

        # found a block in the tags?
        bptr = None
        if (not args.get('struct_depth')
                or len(path) < args.get('struct_depth')):
            bptr = next(((tag, j, d, data)
                for tag, j, d, data in tags
                if (tag & 0xfff) == TAG_BLOCK),
                None)

        # show other btree entries
        if args.get('inner') or not bptr:
            dbg_branch(bid, w, rbyd, rid, tags, len(path)-1)

        if bptr:
            # decode block pointer
            _, _, _, data = bptr
            size, block, off, cksize, cksum = frombptr(data)
            notes = []

            # go ahead and read the full block
            f.seek(block*block_size)
            data = f.read(block_size)

            # check the checksum
            cksum_ = crc32c(data[:cksize])
            if cksum_ != cksum:
                notes.append('cksum!=%08x' % cksum)

            # slice data
            data = data[off:off+size]

            # show the block
            dbg_block(bid, w, rbyd, rid, bptr,
                block, off, size, cksize, cksum, data, notes,
                len(path)-1)


def main(disk, mroots=None, *,
        block_size=None,
        block_count=None,
        color='auto',
        **args):
    # figure out what color should be
    if color == 'auto':
        color = sys.stdout.isatty()
    elif color == 'always':
        color = True
    else:
        color = False

    # is bd geometry specified?
    if isinstance(block_size, tuple):
        block_size, block_count_ = block_size
        if block_count is None:
            block_count = block_count_

    # flatten mroots, default to 0x{0,1}
    if not mroots:
        mroots = [[0,1]]
    mroots = [block for mroots_ in mroots for block in mroots_]

    # we seek around a bunch, so just keep the disk open
    with open(disk, 'rb') as f:
        # if block_size is omitted, assume the block device is one big block
        if block_size is None:
            f.seek(0, os.SEEK_END)
            block_size = f.tell()

        # determine the mleaf_weight from the block_size, this is just for
        # printing purposes
        mleaf_weight = 1 << m.ceil(m.log2(block_size // 8))

        # before we print, we need to do a pass for a few things:
        # - find the actual mroot
        # - find the total weight
        # - are we corrupted?
        # - collect config
        # - collect gstate
        # - any missing or orphaned bookmark entries
        bweight = 0
        rweight = 0
        corrupted = False
        gstate = GState(mleaf_weight)
        config = Config()
        dir_dids = [(0, b'', -1, 0, None, -1, TAG_DID, 0)]
        bookmark_dids = []

        mroot = Rbyd.fetch(f, block_size, mroots)
        mdepth = 1
        while True:
            # corrupted?
            if not mroot:
                corrupted = True
                break

            rweight = max(rweight, mroot.weight)
            # yes we get gstate from all mroots
            gstate.xor(-1, 0, mroot)
            # get the config
            config = Config(mroot)

            # find any dids
            for rid, tag, w, j, d, data in mroot:
                if tag == TAG_DID:
                    did, d = fromleb128(data)
                    dir_dids.append(
                        (did, data[d:], -1, 0, mroot, rid, tag, w))
                elif tag == TAG_BOOKMARK:
                    did, d = fromleb128(data)
                    bookmark_dids.append(
                        (did, data[d:], -1, 0, mroot, rid, tag, w))

            # fetch the next mroot
            done, rid, tag, w, j, d, data, _ = mroot.lookup(-1, TAG_MROOT)
            if not (not done and rid == -1 and tag == TAG_MROOT):
                break

            blocks = frommdir(data)
            mroot = Rbyd.fetch(f, block_size, blocks)
            mdepth += 1

        # fetch the mdir, if there is one
        mdir = None
        done, rid, tag, w, j, _, data, _ = mroot.lookup(-1, TAG_MDIR)
        if not done and rid == -1 and tag == TAG_MDIR:
            blocks = frommdir(data)
            mdir = Rbyd.fetch(f, block_size, blocks)

            # corrupted?
            if not mdir:
                corrupted = True
            else:
                rweight = max(rweight, mdir.weight)
                gstate.xor(0, mdir)

                # find any dids
                for rid, tag, w, j, d, data in mdir:
                    if tag == TAG_DID:
                        did, d = fromleb128(data)
                        dir_dids.append((
                            did, data[d:], 0, 0, mdir, rid, tag, w))
                    elif tag == TAG_BOOKMARK:
                        did, d = fromleb128(data)
                        bookmark_dids.append((
                            did, data[d:], 0, 0, mdir, rid, tag, w))

        # fetch the actual mtree, if there is one
        mtree = None
        done, rid, tag, w, j, d, data, _ = mroot.lookup(-1, TAG_MTREE)
        if not done and rid == -1 and tag == TAG_MTREE:
            w, block, trunk, cksum = frombtree(data)
            mtree = Rbyd.fetch(f, block_size, block, trunk)

            bweight = w

            # traverse entries
            mbid = -1
            while True:
                done, mbid, mw, rbyd, rid, tags, path = mtree.btree_lookup(
                    f, block_size, mbid+1)
                if done:
                    break

                # corrupted?
                if not rbyd:
                    corrupted = True
                    continue

                mdir__ = next(((tag, j, d, data)
                    for tag, j, d, data in tags
                    if tag == TAG_MDIR),
                    None)

                if mdir__:
                    # fetch the mdir
                    _, _, _, data = mdir__
                    blocks = frommdir(data)
                    mdir_ = Rbyd.fetch(f, block_size, blocks)

                    # corrupted?
                    if not mdir_:
                        corrupted = True
                    else:
                        rweight = max(rweight, mdir_.weight)
                        gstate.xor(mbid, mw, mdir_)

                        # find any dids
                        for rid, tag, w, j, d, data in mdir_:
                            if tag == TAG_DID:
                                did, d = fromleb128(data)
                                dir_dids.append((
                                    did, data[d:],
                                    mbid, mw, mdir_, rid, tag, w))
                            elif tag == TAG_BOOKMARK:
                                did, d = fromleb128(data)
                                bookmark_dids.append((
                                    did, data[d:],
                                    mbid, mw, mdir_, rid, tag, w))

        # remove grms from our found dids, we treat these as already deleted
        grmed_dir_dids = {did_
            for (did_, name_, mbid_, mw_, mdir_, rid_, tag_, w_)
            in dir_dids
            if (max(mbid_-max(mw_-1, 0), 0), rid_) not in gstate.grm}
        grmed_bookmark_dids = {did_
            for (did_, name_, mbid_, mw_, mdir_, rid_, tag_, w_)
            in bookmark_dids
            if (max(mbid_-max(mw_-1, 0), 0), rid_) not in gstate.grm}

        # treat the filesystem as corrupted if our dirs and bookmarks are
        # mismatched, this should never happen unless there's a bug
        if grmed_dir_dids != grmed_bookmark_dids:
            corrupted = True

        # are we going to end up rendering the dtree?
        dtree = args.get('files') or not (
            args.get('config') or args.get('gstate'))

        # do a pass to find the width that fits file names+tree, this
        # may not terminate! It's up to the user to use -Z in that case
        f_width = 0
        if dtree:
            def rec_f_width(did, depth):
                depth_ = 0
                width_ = 0
                for name, mbid, mw, mdir, rid, tag, w in mroot.mtree_dir(
                        f, block_size, did):
                    width_ = max(width_, len(name))
                    # recurse?
                    if tag == TAG_DIR and depth > 1:
                        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                            rid, TAG_DID)
                        if not done and rid_ == rid and tag_ == TAG_DID:
                            did_, _ = fromleb128(data)
                            depth__, width__ = rec_f_width(did_, depth-1)
                            depth_ = max(depth_, depth__)
                            width_ = max(width_, width__)
                return 1+depth_, width_

            depth, f_width = rec_f_width(0, args.get('depth') or m.inf)
            # adjust to make space for max depth
            f_width += 4*(depth-1)


        #### actual debugging begins here

        # print some information about the filesystem
        print('littlefs v%s.%s %dx%d %s, rev %d, weight %d.%d' % (
            config.version[0] if config.version[0] is not None else '?',
            config.version[1] if config.version[1] is not None else '?',
            (config.geometry[0] or 0), (config.geometry[1] or 0),
            mroot.addr(), mroot.rev, bweight//mleaf_weight, 1*mleaf_weight))

        # dynamically size the id field
        w_width = max(
            m.ceil(m.log10(max(1, bweight//mleaf_weight)+1)),
            m.ceil(m.log10(max(1, rweight)+1)),
            # in case of -1.-1
            2)

        # print config?
        if args.get('config'):
            for i, (repr_, tag, j, data) in enumerate(config.repr()):
                print('%12s %*s %-*s  %s' % (
                    '{%s}:' % ','.join('%04x' % block
                        for block in it.chain([mroot.block],
                            mroot.redund_blocks))
                        if i == 0 else '',
                    2*w_width+1, '%d.%d' % (-1, -1)
                        if i == 0 else '',
                    21+w_width, repr_,
                    next(xxd(data, 8), '')
                        if not args.get('raw')
                            and not args.get('no_truncate') else ''))

                # show in-device representation
                if args.get('device'):
                    print('%11s  %*s %04x %08x %07x' % (
                        '',
                        2*w_width+1, '',
                        tag, 0, len(data)))

                # show on-disk encoding
                if args.get('raw') or args.get('no_truncate'):
                    for o, line in enumerate(xxd(data)):
                        print('%11s: %*s %s' % (
                            '%04x' % (j + o*16),
                            2*w_width+1, '',
                            line))

        # print gstate?
        if args.get('gstate'):
            for i, (repr_, tag, data) in enumerate(gstate.repr()):
                print('%12s %*s %-*s  %s' % (
                    'gstate:' if i == 0 else '',
                    2*w_width+1, 'g' if i == 0 else '',
                    21+w_width, repr_,
                    next(xxd(data, 8), '')
                        if not args.get('raw')
                            and not args.get('no_truncate') else ''))

                # show in-device representation
                if args.get('device'):
                    print('%11s  %*s %04x %08x %07x' % (
                        '',
                        2*w_width+1, '',
                        tag, 0, len(data)))

                # show on-disk encoding
                if args.get('raw') or args.get('no_truncate'):
                    for o, line in enumerate(xxd(data)):
                        print('%11s: %*s %s' % (
                            '%04x' % (o*16),
                            2*w_width+1, '',
                            line))

                # print gdeltas?
                if args.get('gdelta'):
                    for mbid, mw, mdir, j, d, data in gstate.gdelta[tag]:
                        print('%s%12s %*s %-*s  %s%s' % (
                            '\x1b[90m' if color else '',
                            '{%s}:' % ','.join('%04x' % block
                                for block in it.chain([mdir.block],
                                    mdir.redund_blocks)),
                            2*w_width+1, '%d.%d' % (mbid//mleaf_weight, -1),
                            21+w_width, tagrepr(tag, 0, len(data)),
                            next(xxd(data, 8), '')
                                if not args.get('raw')
                                    and not args.get('no_truncate') else '',
                            '\x1b[m' if color else ''))

                        # show in-device representation
                        if args.get('device'):
                            print('%11s  %*s %04x %08x %07x' % (
                                '',
                                2*w_width+1, '',
                                tag, 0, len(data)))

                        # show on-disk encoding
                        if args.get('raw'):
                            for o, line in enumerate(xxd(mdir.data[j:j+d])):
                                print('%11s: %*s %s' % (
                                    '%04x' % (j + o*16),
                                    2*w_width+1, '',
                                    line))
                        if args.get('raw') or args.get('no_truncate'):
                            for o, line in enumerate(xxd(data)):
                                print('%11s: %*s %s' % (
                                    '%04x' % (j+d + o*16),
                                    2*w_width+1, '',
                                    line))

        # print dtree?
        if dtree:
            # only show mdir on change
            pmbid = None
            # recursively print directories
            def rec_dir(did, depth, prefixes=('', '', '', '')):
                nonlocal pmbid
                # collect all entries first so we know when the dir ends
                dir = []
                for name, mbid, mw, mdir, rid, tag, w in mroot.mtree_dir(
                        f, block_size, did):
                    if not args.get('all'):
                        # skip bookmarks
                        if tag == TAG_BOOKMARK:
                            continue
                        # skip orphans
                        if tag == TAG_ORPHAN:
                            continue
                        # skip grmed entries
                        if (max(mbid-max(mw-1, 0), 0), rid) in gstate.grm:
                            continue
                    dir.append((name, mbid, mw, mdir, rid, tag, w))

                # if we're root, append any orphaned bookmark entries so they
                # get reported
                if did == 0:
                    for did, name, mbid, mw, mdir, rid, tag, w in bookmark_dids:
                        if did in grmed_dir_dids:
                            continue
                        # skip grmed entries
                        if (not args.get('all')
                                and (max(mbid-max(mw-1, 0), 0), rid)
                                    in gstate.grm):
                            continue
                        dir.append((name, mbid, mw, mdir, rid, tag, w))

                for i, (name, mbid, mw, mdir, rid, tag, w) in enumerate(dir):
                    # some special situations worth reporting
                    notes = []
                    grmed = (max(mbid-max(mw-1, 0), 0), rid) in gstate.grm
                    # grmed?
                    if grmed:
                        notes.append('grmed')
                    # missing bookmark?
                    if tag == TAG_DIR:
                        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                            rid, TAG_DID)
                        if not done and rid_ == rid and tag_ == TAG_DID:
                            did_, _ = fromleb128(data)
                            if did_ not in grmed_bookmark_dids:
                                notes.append('missing bookmark')
                        else:
                            notes.append('missing did')
                    # orphaned?
                    if tag == TAG_BOOKMARK:
                        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                            rid, tag)
                        if not done and rid_ == rid and tag_ == tag:
                            did_, _ = fromleb128(data)
                            if did_ not in grmed_dir_dids:
                                notes.append('orphaned')

                    # print human readable dtree entry
                    print('%s%12s %*s %-*s  %s%s%s' % (
                        '\x1b[31m' if color and not grmed and notes
                            else '\x1b[90m'
                                if color and (grmed
                                    or tag == TAG_BOOKMARK
                                    or tag == TAG_ORPHAN)
                            else '',
                        '{%s}:' % ','.join('%04x' % block
                            for block in it.chain([mdir.block],
                                mdir.redund_blocks))
                            if mbid != pmbid else '',
                        2*w_width+1, '%d.%d-%d' % (
                                mbid//mleaf_weight, rid-(w-1), rid)
                            if w > 1 else '%d.%d' % (mbid//mleaf_weight, rid)
                            if w > 0 else '',
                        f_width, '%s%s' % (
                            prefixes[0+(i==len(dir)-1)],
                            name.decode('utf8')),
                        frepr(mdir, rid, tag),
                        ' (%s)' % ', '.join(notes) if notes else '',
                        '\x1b[m' if color and (
                                notes
                                    or grmed
                                    or tag == TAG_BOOKMARK
                                    or tag == TAG_ORPHAN)
                            else ''))
                    pmbid = mbid

                    # print attrs associated with this file?
                    if args.get('attrs'):
                        tag_ = 0
                        while True:
                            done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                                rid, tag_+0x1)
                            if done or rid_ != rid:
                                break

                            print('%12s %*s %-*s  %s' % (
                                '',
                                2*w_width+1, '',
                                21+w_width, tagrepr(tag_, w_, len(data)),
                                next(xxd(data, 8), '')
                                    if not args.get('raw')
                                        and not args.get('no_truncate')
                                    else ''))

                            # show in-device representation
                            if args.get('device'):
                                print('%11s  %*s %04x %08x %07x' % (
                                    '',
                                    2*w_width+1, '',
                                    tag_, w_, len(data)))

                            # show on-disk encoding
                            if args.get('raw'):
                                for o, line in enumerate(xxd(mdir.data[j:j+d])):
                                    print('%11s: %*s %s' % (
                                        '%04x' % (j + o*16),
                                        2*w_width+1, '',
                                        line))
                            if args.get('raw') or args.get('no_truncate'):
                                for o, line in enumerate(xxd(data)):
                                    print('%11s: %*s %s' % (
                                        '%04x' % (j+d + o*16),
                                        2*w_width+1, '',
                                        line))

                    # print file contents?
                    if ((tag == TAG_REG or tag == TAG_ORPHAN)
                            and args.get('structs')):
                        # inlined sprout?
                        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                            rid, TAG_DATA)
                        if not done and rid_ == rid and tag_ == TAG_DATA:
                            dbg_fstruct(f, block_size,
                                mdir, rid_, tag_, j, d, data,
                                m_width=2*w_width+1,
                                color=color,
                                args=args)

                        # direct block?
                        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                            rid, TAG_BLOCK)
                        if not done and rid_ == rid and tag_ == TAG_BLOCK:
                            dbg_fstruct(f, block_size,
                                mdir, rid_, tag_, j, d, data,
                                m_width=2*w_width+1,
                                color=color,
                                args=args)

                        # inlined bshrub?
                        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                            rid, TAG_BSHRUB)
                        if not done and rid_ == rid and tag_ == TAG_BSHRUB:
                            dbg_fstruct(f, block_size,
                                mdir, rid_, tag_, j, d, data,
                                m_width=2*w_width+1,
                                color=color,
                                args=args)

                        # indirect btree?
                        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                            rid, TAG_BTREE)
                        if not done and rid_ == rid and tag_ == TAG_BTREE:
                            dbg_fstruct(f, block_size,
                                mdir, rid_, tag_, j, d, data,
                                m_width=2*w_width+1,
                                color=color,
                                args=args)

                    # recurse?
                    if tag == TAG_DIR and depth > 1:
                        done, rid_, tag_, w_, j, d, data, _ = mdir.lookup(
                            rid, TAG_DID)
                        if not done and rid_ == rid and tag_ == TAG_DID:
                            did_, _ = fromleb128(data)
                            rec_dir(
                                did_,
                                depth-1,
                                (prefixes[2+(i==len(dir)-1)] + "|-> ",
                                 prefixes[2+(i==len(dir)-1)] + "'-> ",
                                 prefixes[2+(i==len(dir)-1)] + "|   ",
                                 prefixes[2+(i==len(dir)-1)] + "    "))

            rec_dir(0, args.get('depth') or m.inf)

    if args.get('error_on_corrupt') and corrupted:
        sys.exit(2)


if __name__ == "__main__":
    import argparse
    import sys
    parser = argparse.ArgumentParser(
        description="Debug littlefs stuff.",
        allow_abbrev=False)
    parser.add_argument(
        'disk',
        help="File containing the block device.")
    parser.add_argument(
        'mroots',
        nargs='*',
        type=rbydaddr,
        help="Block address of the mroots. Defaults to 0x{0,1}.")
    parser.add_argument(
        '-b', '--block-size',
        type=bdgeom,
        help="Block size/geometry in bytes.")
    parser.add_argument(
        '--block-count',
        type=lambda x: int(x, 0),
        help="Block count in blocks.")
    parser.add_argument(
        '--color',
        choices=['never', 'always', 'auto'],
        default='auto',
        help="When to use terminal colors. Defaults to 'auto'.")
    parser.add_argument(
        '-c', '--config',
        action='store_true',
        help="Show the on-disk config.")
    parser.add_argument(
        '-g', '--gstate',
        action='store_true',
        help="Show the current global-state.")
    parser.add_argument(
        '-d', '--gdelta',
        action='store_true',
        help="Show the gdelta that xors into the global-state.")
    parser.add_argument(
        '-f', '--files',
        action='store_true',
        help="Show the files and directory tree (default).")
    parser.add_argument(
        '-A', '--attrs',
        action='store_true',
        help="Show all attributes belonging to each file.")
    parser.add_argument(
        '-a', '--all',
        action='store_true',
        help="Show all files including bookmarks and grmed files.")
    parser.add_argument(
        '-r', '--raw',
        action='store_true',
        help="Show the raw data including tag encodings.")
    parser.add_argument(
        '-x', '--device',
        action='store_true',
        help="Show the device-side representation of tags.")
    parser.add_argument(
        '-T', '--no-truncate',
        action='store_true',
        help="Don't truncate, show the full contents.")
    parser.add_argument(
        '-z', '--depth',
        nargs='?',
        type=lambda x: int(x, 0),
        const=0,
        help="Depth of the filesystem tree to show.")
    parser.add_argument(
        '-s', '--structs',
        action='store_true',
        help="Store file data structures and data.")
    parser.add_argument(
        '-t', '--tree',
        action='store_true',
        help="Show the underlying rbyd trees.")
    parser.add_argument(
        '-B', '--btree',
        action='store_true',
        help="Show the underlying B-tree.")
    parser.add_argument(
        '-i', '--inner',
        action='store_true',
        help="Show inner branches.")
    parser.add_argument(
        '-Z', '--struct-depth',
        nargs='?',
        type=lambda x: int(x, 0),
        const=0,
        help="Depth of struct trees to show.")
    parser.add_argument(
        '-e', '--error-on-corrupt',
        action='store_true',
        help="Error if the filesystem is corrupt.")
    sys.exit(main(**{k: v
        for k, v in vars(parser.parse_intermixed_args()).items()
        if v is not None}))