SickGear/lib/hachoir_py3/parser/misc/ole2.py

"""
Microsoft Office documents parser.
OLE2 files are also used by many other programs to store data.

Informations:
* wordole.c of AntiWord program (v0.35)
  Copyright (C) 1998-2003 A.J. van Os
  Released under GNU GPL
  http://www.winfield.demon.nl/
* File gsf-infile-msole.c of libgsf library (v1.14.0)
  Copyright (C) 2002-2004 Jody Goldberg (jody@gnome.org)
  Released under GNU LGPL 2.1
  http://freshmeat.net/projects/libgsf/
* PDF from AAF Association
  Copyright (C) 2004 AAF Association
  Copyright (C) 1991-2003 Microsoft Corporation
  http://www.aafassociation.org/html/specs/aafcontainerspec-v1.0.1.pdf

Author: Victor Stinner
Creation: 2006-04-23
"""

from hachoir_py3.parser import HachoirParser
from hachoir_py3.field import (
    FieldSet, ParserError, SeekableFieldSet, RootSeekableFieldSet,
    UInt8, UInt16, UInt32, UInt64, TimestampWin64, Enum,
    Bytes, NullBytes, String, CustomFragment)
from hachoir_py3.core.text_handler import filesizeHandler
from hachoir_py3.core.endian import LITTLE_ENDIAN
from hachoir_py3.parser.common.win32 import GUID
from hachoir_py3.parser.misc.msoffice import PROPERTY_NAME, RootEntry, RawParser

# Accepted range for the header's "bb_shift" field (log2 of the big block
# size in bytes). Sector sizes are handled in bits elsewhere in this module
# (sector_size = 8 << bb_shift).
MIN_BIG_BLOCK_LOG2 = 6   # 64 bytes (512 bits)
MAX_BIG_BLOCK_LOG2 = 14  # 16 kB

# Number of DIFAT entries stored directly after the header
# (they are counted in HEADER_SIZE)
NB_DIFAT = 109


class SECT(UInt32):
    """
    Sector index stored as an unsigned 32-bit integer.

    The four highest values are reserved markers; they are displayed
    using a readable label instead of the raw number.
    """
    UNUSED = 0xFFFFFFFF   # -1
    END_OF_CHAIN = 0xFFFFFFFE   # -2
    BFAT_SECTOR = 0xFFFFFFFD   # -3
    DIFAT_SECTOR = 0xFFFFFFFC   # -4

    # Display label of each reserved marker
    special_value_name = {
        UNUSED: "unused",
        END_OF_CHAIN: "end of a chain",
        BFAT_SECTOR: "BFAT sector (in a FAT)",
        DIFAT_SECTOR: "DIFAT sector (in a FAT)",
    }

    # Every reserved marker, for quick membership tests
    SPECIALS = set(special_value_name)

    def __init__(self, parent, name, description=None):
        UInt32.__init__(self, parent, name, description)

    def createDisplay(self):
        """Return the marker label for reserved values, else the number as text."""
        raw = self.value
        if raw in SECT.special_value_name:
            return SECT.special_value_name[raw]
        return str(raw)


class Property(FieldSet):
    """
    Directory entry (128 bytes): name, type, tree links, CLSID, timestamps,
    starting sector and size of one storage, stream or root item.
    """
    TYPE_ROOT = 5
    TYPE_NAME = {
        1: "storage",
        2: "stream",
        3: "ILockBytes",
        4: "IPropertyStorage",
        5: "root"
    }
    DECORATOR_NAME = {
        0: "red",
        1: "black",
    }
    static_size = 128 * 8

    def createFields(self):
        """Yield the entry fields in on-disk order."""
        # Peek at the first four bytes of the entry: the pattern "\0R\0\0"
        # selects big endian UTF-16 for the name, anything else little endian.
        leading = self.stream.readBytes(self.absolute_address, 4)
        charset = "UTF-16-BE" if leading == b"\0R\0\0" else "UTF-16-LE"

        yield String(self, "name", 64, charset=charset, truncate="\0")
        yield UInt16(self, "namelen", "Length of the name")

        # Two one-byte enumerations
        enums = (
            ("type", "Property type", self.TYPE_NAME),
            ("decorator", "Decorator", self.DECORATOR_NAME),
        )
        for key, label, names in enums:
            yield Enum(UInt8(self, key, label), names)

        # Links to other entries
        for branch in ("left", "right"):
            yield SECT(self, branch)
        yield SECT(self, "child", "Child node (valid for storage and root types)")

        yield GUID(self, "clsid", "CLSID of this storage (valid for storage and root types)")
        yield NullBytes(self, "flags", 4, "User flags")
        yield TimestampWin64(self, "creation", "Creation timestamp(valid for storage and root types)")
        yield TimestampWin64(self, "lastmod", "Modify timestamp (valid for storage and root types)")
        yield SECT(self, "start", "Starting SECT of the stream (valid for stream and root types)")

        # With bb_shift == 9 the size is 32 bits followed by 4 bytes of
        # padding; otherwise the full 64 bits hold the size.
        size_desc = "Size in bytes (valid for stream and root types)"
        if self["/header/bb_shift"].value == 9:
            yield filesizeHandler(UInt32(self, "size", size_desc))
            yield NullBytes(self, "padding", 4)
        else:
            yield filesizeHandler(UInt64(self, "size", size_desc))

    def createDescription(self):
        """Describe the entry using its displayed name and size."""
        return "Property: %s (%s)" % (self["name"].display, self["size"].display)


class DIFat(SeekableFieldSet):
    """
    DIFAT: the NB_DIFAT entries located right after the header, followed by
    the entries of each additional DIFAT sector of the chain.
    """

    def __init__(self, parent, name, db_start, db_count, description=None):
        """
        db_start is the sector index of the first additional DIFAT sector,
        db_count the number of additional DIFAT sectors to read.
        """
        SeekableFieldSet.__init__(self, parent, name, description)
        self.start = db_start
        self.count = db_count

    def createFields(self):
        """Yield every "index[n]" entry plus one "difat[n]" link per extra sector."""
        # Entries stored directly after the header
        for slot in range(NB_DIFAT):
            yield SECT(self, "index[%u]" % slot)

        sector = self.start
        base = NB_DIFAT
        # The last SECT of each DIFAT sector is the link to the next one
        # (sector_size is in bits, a SECT takes 32 bits)
        per_sector = self.parent.sector_size // 32 - 1
        for chain_pos in range(self.count):
            # Address relative to the start of this field set, which begins
            # at the header-resident DIFAT entries
            self.seekBit(NB_DIFAT * SECT.static_size +
                         self.parent.sector_size * sector)
            for offset in range(per_sector):
                yield SECT(self, "index[%u]" % (base + offset))
            base += per_sector
            link = SECT(self, "difat[%u]" % chain_pos)
            yield link
            sector = link.value


class Header(FieldSet):
    """Fixed-size (68 bytes) header record of an OLE2 file."""
    static_size = 68 * 8

    def createFields(self):
        """Yield the header fields in on-disk order."""
        # (field class, constructor arguments following the parent).
        # Fields are instantiated one at a time inside the loop, only when
        # the generator reaches them.
        layout = (
            (GUID, ("clsid", "16 bytes GUID used by some apps")),
            (UInt16, ("ver_min", "Minor version")),
            (UInt16, ("ver_maj", "Major version")),
            (Bytes, ("endian", 2, "Endian (\\xfe\\xff for little endian)")),
            (UInt16, ("bb_shift", "Log, base 2, of the big block size")),
            (UInt16, ("sb_shift", "Log, base 2, of the small block size")),
            (NullBytes, ("reserved[]", 6, "(reserved)")),
            (UInt32, ("csectdir", "Number of SECTs in directory chain for 4 KB sectors (version 4)")),
            (UInt32, ("bb_count", "Number of Big Block Depot blocks")),
            (SECT, ("bb_start", "Root start block")),
            (NullBytes, ("transaction", 4, "Signature used for transactions (must be zero)")),
            (UInt32, ("threshold", "Maximum size for a mini stream (typically 4096 bytes)")),
            (SECT, ("sb_start", "Small Block Depot start block")),
            (UInt32, ("sb_count",)),
            (SECT, ("db_start", "First block of DIFAT")),
            (UInt32, ("db_count", "Number of SECTs in DIFAT")),
        )
        for field_class, args in layout:
            yield field_class(self, *args)


# Header (ole_id, header, difat) size in bits: 8-byte signature (64 bits),
# header record and the NB_DIFAT entries that follow it.
# Used as the base offset passed to seekBit().
HEADER_SIZE = 64 + Header.static_size + NB_DIFAT * SECT.static_size


class SectFat(FieldSet):
    """
    One FAT sector: `count` consecutive SECT entries, named "index[n]"
    with n running from `start`.
    """

    def __init__(self, parent, name, start, count, description=None):
        # Each entry takes 32 bits
        FieldSet.__init__(self, parent, name, description, size=count * 32)
        self.start = start
        self.count = count

    def createFields(self):
        """Yield the entries, numbered from self.start."""
        first = self.start
        for number in range(first, first + self.count):
            yield SECT(self, "index[%u]" % number)


class OLE2_File(HachoirParser, RootSeekableFieldSet):
    """
    Root parser of an OLE2 file: signature, header, DIFAT, FAT sectors,
    properties (directory entries) and the content of the properties.
    """
    # Parser metadata: identifier, category, known file extensions and MIME
    # types, minimum size, description and magic signature (at offset 0).
    PARSER_TAGS = {
        "id": "ole2",
        "category": "misc",
        "file_ext": (
            "db",                        # Thumbs.db
            "doc", "dot",                # Microsoft Word
            "ppt", "ppz", "pps", "pot",  # Microsoft Powerpoint
            "xls", "xla",                # Microsoft Excel
            "msi",                       # Windows installer
        ),
        "mime": (
            "application/msword",
            "application/msexcel",
            "application/mspowerpoint",
        ),
        # presumably expressed in bits (512 bytes) like the other sizes
        # of this module -- TODO confirm against HachoirParser
        "min_size": 512 * 8,
        "description": "Microsoft Office document",
        "magic": ((b"\xD0\xCF\x11\xE0\xA1\xB1\x1A\xE1", 0),),
    }
    # Byte order used to decode the fields
    endian = LITTLE_ENDIAN

    def __init__(self, stream, **args):
        """
        Create the root field set (named "root", without parent) on `stream`,
        then initialize the parser part with the extra keyword arguments.
        """
        total_size = stream.askSize(self)
        RootSeekableFieldSet.__init__(self, None, "root", stream, None, total_size)
        HachoirParser.__init__(self, stream, **args)

    def close(self):
        """Close the input stream used by the parser."""
        stream = self.stream
        stream.close()

    def __enter__(self):
        """Context manager entry: return the parser itself."""
        return self

    def __exit__(self, type, value, traceback):
        """Context manager exit: close the parser; exceptions are not suppressed."""
        self.close()

    def validate(self):
        """
        Check signature, major version, endian marker and block size shifts.

        Return True when the file looks valid, else an error message.
        """
        if self["ole_id"].value != b"\xD0\xCF\x11\xE0\xA1\xB1\x1A\xE1":
            return "Invalid magic"

        major = self["header/ver_maj"].value
        if major not in (3, 4):
            return "Unknown major version (%s)" % major

        endian_field = self["header/endian"]
        if endian_field.value not in (b"\xFF\xFE", b"\xFE\xFF"):
            return "Unknown endian (%s)" % endian_field.raw_display

        big_shift = self["header/bb_shift"].value
        if big_shift < MIN_BIG_BLOCK_LOG2 or MAX_BIG_BLOCK_LOG2 < big_shift:
            return "Invalid (log 2 of) big block size (%s)" % big_shift

        small_shift = self["header/sb_shift"].value
        if big_shift < small_shift:
            return "Small block size (log2=%s) is bigger than big block size (log2=%s)!" \
                % (small_shift, big_shift)

        return True

    def createFields(self):
        """
        Yield the whole file structure: signature, header, DIFAT, FAT
        sectors, SFAT sectors, properties, then the content of each property.
        """
        yield Bytes(self, "ole_id", 8, "OLE object signature")

        hdr = Header(self, "header")
        yield hdr

        # Sizes derived from the header (sector sizes are in bits)
        self.sector_size = 8 << hdr["bb_shift"].value
        self.fat_count = hdr["bb_count"].value
        self.items_per_bbfat = self.sector_size // SECT.static_size
        self.ss_size = 8 << hdr["sb_shift"].value
        self.items_per_ssfat = self.items_per_bbfat

        # DIFAT lists the sectors holding the FAT
        yield DIFat(self, "difat", hdr["db_start"].value, hdr["db_count"].value, "Double Indirection FAT")

        # FAT sectors, then SFAT sectors
        yield from self.readBFAT()
        yield from self.readSFAT()

        # Properties: follow the chain starting at header/bb_start
        directory_chain = self.getChain(self["header/bb_start"].value)
        entries_per_sector = self.sector_size // Property.static_size
        self.properties = []
        for sector in directory_chain:
            self.seekBlock(sector)
            for _ in range(entries_per_sector):
                entry = Property(self, "property[]")
                yield entry
                self.properties.append(entry)

        # Content of every property: the first one is the root entry, the
        # others use the parser registered for their name (raw otherwise)
        for position, entry in enumerate(self.properties):
            if position:
                try:
                    prefix, content_parser = PROPERTY_NAME[entry["name"].value]
                except LookupError:
                    prefix = entry.name + "content"
                    content_parser = RawParser
            else:
                prefix, content_parser = 'root', RootEntry
            yield from self.parseProperty(entry, prefix, content_parser)

    def parseProperty(self, property, name_prefix, parser=RawParser):
        """
        Yield the content of a property as CustomFragment fields, one per
        run of consecutive big blocks; all fragments share the same group.

        Nothing is yielded for an empty property, nor for a property
        smaller than header/threshold (except with the 'root' prefix).
        """
        if not property["size"].value:
            return
        if property["size"].value < self["header/threshold"].value and name_prefix != 'root':
            return

        def contiguous_runs(blocks):
            # Lazily merge consecutive block numbers into (first, last) pairs
            run_first = run_last = None
            for number in blocks:
                if run_first is None:
                    run_first = run_last = number
                elif number == run_last + 1:
                    run_last = number
                else:
                    yield run_first, run_last
                    run_first = run_last = number
            if run_first is not None:
                yield run_first, run_last

        field_name = "%s[]" % name_prefix
        fragment_group = None
        chain = self.getChain(property["start"].value)
        for run_first, run_last in contiguous_runs(chain):
            block_count = run_last - run_first + 1
            self.seekBlock(run_first)
            desc = ("Big blocks %s..%s (%s)" % (run_first, run_last, block_count)) \
                + (" of %s bytes" % (self.sector_size // 8))
            fragment = CustomFragment(
                self, field_name, block_count * self.sector_size,
                parser, desc, fragment_group)
            if not fragment_group:
                # First fragment: keep its group and attach the arguments
                fragment_group = fragment.group
                fragment_group.args["ole2"] = fragment.root
                fragment_group.args["datasize"] = property["size"].value
                fragment_group.args["ole2name"] = property["name"].value
            yield fragment

    def getChain(self, start, use_sfat=False):
        """
        Generate the block numbers of a chain, starting at `start` and
        following the FAT (or the SFAT when use_sfat is set) up to the
        end-of-chain marker.

        The chain also stops silently when a FAT entry can't be found.
        Raise ParserError on a reserved block number or on a loop.
        """
        if use_sfat:
            fat, items_per_fat, err_prefix = (
                self.ss_fat, self.items_per_ssfat, "SFAT chain")
        else:
            fat, items_per_fat, err_prefix = (
                self.bb_fat, self.items_per_bbfat, "BFAT chain")

        visited = set()
        current = previous = start
        while current != SECT.END_OF_CHAIN:
            if current in SECT.SPECIALS:
                raise ParserError("%s: Invalid block index (0x%08x), previous=%s" % (
                    err_prefix, current, previous))
            if current in visited:
                raise ParserError("%s: Found a loop (%s=>%s)" %
                                  (err_prefix, previous, current))
            visited.add(current)
            yield current
            previous = current
            # Select the FAT sector holding the entry of the current block
            fat_index = current // items_per_fat
            try:
                current = fat[fat_index]["index[%u]" % current].value
            except LookupError:
                break

    def readBFAT(self):
        """
        Yield one SectFat ("bbfat[]") per DIFAT entry, stopping at the first
        unused entry; the fields are also stored in self.bb_fat.
        """
        self.bb_fat = []
        per_fat = self.items_per_bbfat
        for position, slot in enumerate(self.array("difat/index")):
            sector = slot.value
            if sector == SECT.UNUSED:
                break

            label = "FAT %u/%u at block %u" % \
                (position + 1, self["header/bb_count"].value, sector)

            self.seekBlock(sector)
            # Entries are numbered continuously across the FAT sectors
            fat_field = SectFat(self, "bbfat[]", position * per_fat, per_fat, label)
            yield fat_field
            self.bb_fat.append(fat_field)

    def readSFAT(self):
        """
        Yield one SectFat ("sfat[]") per block of the chain starting at
        header/sb_start; the fields are also stored in self.ss_fat.
        """
        sfat_chain = self.getChain(self["header/sb_start"].value)
        self.ss_fat = []
        per_fat = self.items_per_ssfat
        for position, sector in enumerate(sfat_chain):
            self.seekBlock(sector)
            label = "SFAT %u/%u at block %u" % \
                (position + 1, self["header/sb_count"].value, sector)
            # Entries are numbered continuously across the SFAT sectors
            sfat_field = SectFat(self, "sfat[]", position * per_fat, per_fat, label)
            yield sfat_field
            self.ss_fat.append(sfat_field)

    def createContentSize(self):
        """
        Compute the content size in bits: header plus every block up to the
        highest block number referenced by the FAT sectors ("bbfat" array).

        Reserved markers (SECT.SPECIALS) are ignored; without any regular
        entry, block 0 is used as the highest block.
        """
        max_block = 0
        for fat in self.array("bbfat"):
            for entry in fat:
                block = entry.value
                if block not in SECT.SPECIALS and block > max_block:
                    max_block = block
        # max_block only ever holds 0 or a non-reserved value, so no check
        # against SECT.SPECIALS is needed here
        return HEADER_SIZE + (max_block + 1) * self.sector_size

    def seekBlock(self, block):
        """Move to the start of big block number `block` (blocks follow the header)."""
        bit_offset = HEADER_SIZE + block * self.sector_size
        self.seekBit(bit_offset)
Change core system to improve performance and facilitate multi TV info sources. Change migrate core objects TVShow and TVEpisode and everywhere that these objects affect. Add message to logs and disable ui backlog buttons when no media provider has active and/or scheduled searching enabled. Change views for py3 compat. Change set default runtime of 5 mins if none is given for layout Day by Day. Add OpenSubtitles authentication support to config/Subtitles/Subtitles Plugin. Add "Enforce media hash match" to config/Subtitles Plugin/Opensubtitles for accurate subs if enabled, but if disabled, search failures will fallback to use less reliable subtitle results. Add Apprise 0.8.0 (6aa52c3). Add hachoir_py3 3.0a6 (5b9e05a). Add sgmllib3k 1.0.0 Update soupsieve 1.9.1 (24859cc) to soupsieve_py2 1.9.5 (6a38398) Add soupsieve_py3 2.0.0.dev (69194a2). Add Tornado_py3 Web Server 6.0.3 (ff985fe). Add xmlrpclib_to 0.1.1 (c37db9e). Remove ancient Growl lib 0.1 Remove xmltodict library. Change requirements.txt for Cheetah3 to minimum 3.2.4 Change update sabToSickBeard. Change update autoProcessTV. Change remove Twitter notifier. Update NZBGet Process Media extension, SickGear-NG 1.7 → 2.4 Update Kodi addon 1.0.3 → 1.0.4 Update ADBA for py3. Update Beautiful Soup 4.8.0 (r526) to 4.8.1 (r531). Update Send2Trash 1.3.0 (a568370) to 1.5.0 (66afce7). Update soupsieve 1.9.1 (24859cc) to 1.9.5 (6a38398). Change use GNTP (Growl Notification Transport Protocol) from Apprise. Change add multi host support to Growl notifier. Fix Growl notifier when using empty password. Change update links for Growl notifications. Change deprecate confg/Notifications/Growl password field as these are now stored with host setting. Fix prevent infinite memoryError from a particular jpg data structure. Change subliminal for py3. Change enzyme for py3. Change browser_ua for py3. Change feedparser for py3 (sgmlib is no longer available on py3 as standardlib so added ext lib) Fix Guessit. Fix parse_xml for py3. 
Fix name parser with multi eps for py3. Fix tvdb_api fixes for py3 (search show). Fix config/media process to only display "pattern is invalid" qtip on "Episode naming" tab if the associated field is actually visible. Also, if the field becomes hidden due to a setting change, hide any previously displayed qtip. Note for Javascript::getelementbyid (or $('tag[id="<name>"')) is required when an id is being searched in the dom due to ":" used in a shows id name. Change download anidb xml files to main cache folder and use adba lib folder as a last resort. Change create get anidb show groups as centralised helper func and consolidate dupe code. Change move anidb related functions to newly renamed anime.py (from blacklistandwhitelist.py). Change str encode hex no longer exits in py3, use codecs.encode(...) instead. Change fix b64decode on py3 returns bytestrings. Change use binary read when downloading log file via browser to prevent any encoding issues. Change add case insensitive ordering to anime black/whitelist. Fix anime groups list not excluding whitelisted stuff. Change add Windows utf8 fix ... see: ytdl-org/youtube-dl#820 Change if no qualities are wanted, exit manual search thread. Fix keepalive for py3 process media. Change add a once a month update of tvinfo show mappings to the daily updater. Change autocorrect ids of new shows by updating from -8 to 31 days of the airdate of episode one. Add next run time to Manage/Show Tasks/Daily show update. Change when fetching imdb data, if imdb id is an episode id then try to find and use real show id. Change delete diskcache db in imdbpie when value error (due to change in Python version). Change during startup, cleanup any _cleaner.pyc/o to prevent issues when switching python versions. Add .pyc cleaner if python version is switched. Change replace deprecated gettz_db_metadata() and gettz. Change rebrand "SickGear PostProcessing script" to "SickGear Process Media extension". 
Change improve setup guide to use the NZBGet version to minimise displayed text based on version. Change NZBGet versions prior to v17 now told to upgrade as those version are no longer supported - code has actually exit on start up for some time but docs were outdated. Change comment out code and unused option sg_base_path. Change supported Python version 2.7.9-2.7.18 inclusive expanded to 3.7.1-3.8.1 inclusive. Change pidfile creation under Linux 0o644. Make logger accept lists to output continuously using the log_lock instead of split up by other processes. Fix long path issues with Windows process media. 6 years ago			`"""`
			`Microsoft Office documents parser.`
			`OLE2 files are also used by many other programs to store data.`

			`Informations:`
			`* wordole.c of AntiWord program (v0.35)`
			`Copyright (C) 1998-2003 A.J. van Os`
			`Released under GNU GPL`
			`http://www.winfield.demon.nl/`
			`* File gsf-infile-msole.c of libgsf library (v1.14.0)`
			`Copyright (C) 2002-2004 Jody Goldberg (jody@gnome.org)`
			`Released under GNU LGPL 2.1`
			`http://freshmeat.net/projects/libgsf/`
			`* PDF from AAF Association`
			`Copyright (C) 2004 AAF Association`
			`Copyright (C) 1991-2003 Microsoft Corporation`
			`http://www.aafassociation.org/html/specs/aafcontainerspec-v1.0.1.pdf`

			`Author: Victor Stinner`
			`Creation: 2006-04-23`
			`"""`

			`from hachoir_py3.parser import HachoirParser`
			`from hachoir_py3.field import (`
			`FieldSet, ParserError, SeekableFieldSet, RootSeekableFieldSet,`
			`UInt8, UInt16, UInt32, UInt64, TimestampWin64, Enum,`
			`Bytes, NullBytes, String, CustomFragment)`
			`from hachoir_py3.core.text_handler import filesizeHandler`
			`from hachoir_py3.core.endian import LITTLE_ENDIAN`
			`from hachoir_py3.parser.common.win32 import GUID`
			`from hachoir_py3.parser.misc.msoffice import PROPERTY_NAME, RootEntry, RawParser`

			`MIN_BIG_BLOCK_LOG2 = 6 # 512 bytes`
			`MAX_BIG_BLOCK_LOG2 = 14 # 64 kB`

			`# Number of items in DIFAT`
			`NB_DIFAT = 109`


			`class SECT(UInt32):`
			`UNUSED = 0xFFFFFFFF # -1`
			`END_OF_CHAIN = 0xFFFFFFFE # -2`
			`BFAT_SECTOR = 0xFFFFFFFD # -3`
			`DIFAT_SECTOR = 0xFFFFFFFC # -4`
			`SPECIALS = set((END_OF_CHAIN, UNUSED, BFAT_SECTOR, DIFAT_SECTOR))`

			`special_value_name = {`
			`UNUSED: "unused",`
			`END_OF_CHAIN: "end of a chain",`
			`BFAT_SECTOR: "BFAT sector (in a FAT)",`
			`DIFAT_SECTOR: "DIFAT sector (in a FAT)",`
			`}`

			`def __init__(self, parent, name, description=None):`
			`UInt32.__init__(self, parent, name, description)`

			`def createDisplay(self):`
			`val = self.value`
			`return SECT.special_value_name.get(val, str(val))`


			`class Property(FieldSet):`
			`TYPE_ROOT = 5`
			`TYPE_NAME = {`
			`1: "storage",`
			`2: "stream",`
			`3: "ILockBytes",`
			`4: "IPropertyStorage",`
			`5: "root"`
			`}`
			`DECORATOR_NAME = {`
			`0: "red",`
			`1: "black",`
			`}`
			`static_size = 128 * 8`

			`def createFields(self):`
			`bytes = self.stream.readBytes(self.absolute_address, 4)`
			`if bytes == b"\0R\0\0":`
			`charset = "UTF-16-BE"`
			`else:`
			`charset = "UTF-16-LE"`
			`yield String(self, "name", 64, charset=charset, truncate="\0")`
			`yield UInt16(self, "namelen", "Length of the name")`
			`yield Enum(UInt8(self, "type", "Property type"), self.TYPE_NAME)`
			`yield Enum(UInt8(self, "decorator", "Decorator"), self.DECORATOR_NAME)`
			`yield SECT(self, "left")`
			`yield SECT(self, "right")`
			`yield SECT(self, "child", "Child node (valid for storage and root types)")`
			`yield GUID(self, "clsid", "CLSID of this storage (valid for storage and root types)")`
			`yield NullBytes(self, "flags", 4, "User flags")`
			`yield TimestampWin64(self, "creation", "Creation timestamp(valid for storage and root types)")`
			`yield TimestampWin64(self, "lastmod", "Modify timestamp (valid for storage and root types)")`
			`yield SECT(self, "start", "Starting SECT of the stream (valid for stream and root types)")`
			`if self["/header/bb_shift"].value == 9:`
			`yield filesizeHandler(UInt32(self, "size", "Size in bytes (valid for stream and root types)"))`
			`yield NullBytes(self, "padding", 4)`
			`else:`
			`yield filesizeHandler(UInt64(self, "size", "Size in bytes (valid for stream and root types)"))`

			`def createDescription(self):`
			`name = self["name"].display`
			`size = self["size"].display`
			`return "Property: %s (%s)" % (name, size)`


			`class DIFat(SeekableFieldSet):`

			`def __init__(self, parent, name, db_start, db_count, description=None):`
			`SeekableFieldSet.__init__(self, parent, name, description)`
			`self.start = db_start`
			`self.count = db_count`

			`def createFields(self):`
			`for index in range(NB_DIFAT):`
			`yield SECT(self, "index[%u]" % index)`

			`difat_sect = self.start`
			`index = NB_DIFAT`
			`entries_per_sect = self.parent.sector_size // 32 - 1`
			`for ctr in range(self.count):`
			`# this is relative to real DIFAT start`
			`self.seekBit(NB_DIFAT * SECT.static_size +`
			`self.parent.sector_size * difat_sect)`
			`for sect_index in range(entries_per_sect):`
			`yield SECT(self, "index[%u]" % (index + sect_index))`
			`index += entries_per_sect`
			`next = SECT(self, "difat[%u]" % ctr)`
			`yield next`
			`difat_sect = next.value`


			`class Header(FieldSet):`
			`static_size = 68 * 8`

			`def createFields(self):`
			`yield GUID(self, "clsid", "16 bytes GUID used by some apps")`
			`yield UInt16(self, "ver_min", "Minor version")`
			`yield UInt16(self, "ver_maj", "Major version")`
			`yield Bytes(self, "endian", 2, "Endian (\\xfe\\xff for little endian)")`
			`yield UInt16(self, "bb_shift", "Log, base 2, of the big block size")`
			`yield UInt16(self, "sb_shift", "Log, base 2, of the small block size")`
			`yield NullBytes(self, "reserved[]", 6, "(reserved)")`
			`yield UInt32(self, "csectdir", "Number of SECTs in directory chain for 4 KB sectors (version 4)")`
			`yield UInt32(self, "bb_count", "Number of Big Block Depot blocks")`
			`yield SECT(self, "bb_start", "Root start block")`
			`yield NullBytes(self, "transaction", 4, "Signature used for transactions (must be zero)")`
			`yield UInt32(self, "threshold", "Maximum size for a mini stream (typically 4096 bytes)")`
			`yield SECT(self, "sb_start", "Small Block Depot start block")`
			`yield UInt32(self, "sb_count")`
			`yield SECT(self, "db_start", "First block of DIFAT")`
			`yield UInt32(self, "db_count", "Number of SECTs in DIFAT")`


			`# Header (ole_id, header, difat) size in bytes`
			`HEADER_SIZE = 64 + Header.static_size + NB_DIFAT * SECT.static_size`


			`class SectFat(FieldSet):`

			`def __init__(self, parent, name, start, count, description=None):`
			`FieldSet.__init__(self, parent, name, description, size=count * 32)`
			`self.count = count`
			`self.start = start`

			`def createFields(self):`
			`for i in range(self.start, self.start + self.count):`
			`yield SECT(self, "index[%u]" % i)`


			`class OLE2_File(HachoirParser, RootSeekableFieldSet):`
			`PARSER_TAGS = {`
			`"id": "ole2",`
			`"category": "misc",`
			`"file_ext": (`
			`"db", # Thumbs.db`
			`"doc", "dot", # Microsoft Word`
			`"ppt", "ppz", "pps", "pot", # Microsoft Powerpoint`
			`"xls", "xla", # Microsoft Excel`
			`"msi", # Windows installer`
			`),`
			`"mime": (`
			`"application/msword",`
			`"application/msexcel",`
			`"application/mspowerpoint",`
			`),`
			`"min_size": 512 * 8,`
			`"description": "Microsoft Office document",`
			`"magic": ((b"\xD0\xCF\x11\xE0\xA1\xB1\x1A\xE1", 0),),`
			`}`
			`endian = LITTLE_ENDIAN`

			`def __init__(self, stream, **args):`
			`RootSeekableFieldSet.__init__(`
			`self, None, "root", stream, None, stream.askSize(self))`
			`HachoirParser.__init__(self, stream, **args)`

			`def close(self):`
			`self.stream.close()`

			`def __enter__(self):`
			`return self`

			`def __exit__(self, type, value, traceback):`
			`self.close()`

			`def validate(self):`
			`if self["ole_id"].value != b"\xD0\xCF\x11\xE0\xA1\xB1\x1A\xE1":`
			`return "Invalid magic"`
			`if self["header/ver_maj"].value not in (3, 4):`
			`return "Unknown major version (%s)" % self["header/ver_maj"].value`
			`if self["header/endian"].value not in (b"\xFF\xFE", b"\xFE\xFF"):`
			`return "Unknown endian (%s)" % self["header/endian"].raw_display`
			`if not(MIN_BIG_BLOCK_LOG2 <= self["header/bb_shift"].value <= MAX_BIG_BLOCK_LOG2):`
			`return "Invalid (log 2 of) big block size (%s)" % self["header/bb_shift"].value`
			`if self["header/bb_shift"].value < self["header/sb_shift"].value:`
			`return "Small block size (log2=%s) is bigger than big block size (log2=%s)!" \`
			`% (self["header/sb_shift"].value, self["header/bb_shift"].value)`
			`return True`

			`def createFields(self):`
			`# Signature`
			`yield Bytes(self, "ole_id", 8, "OLE object signature")`

			`header = Header(self, "header")`
			`yield header`

			`# Configure values`
			`self.sector_size = (8 << header["bb_shift"].value)`
			`self.fat_count = header["bb_count"].value`
			`self.items_per_bbfat = self.sector_size // SECT.static_size`
			`self.ss_size = (8 << header["sb_shift"].value)`
			`self.items_per_ssfat = self.items_per_bbfat`

			`# Read DIFAT (one level of indirection)`
			`yield DIFat(self, "difat", header["db_start"].value, header["db_count"].value, "Double Indirection FAT")`

			`# Read FAT (one level of indirection)`
			`yield from self.readBFAT()`

			`# Read SFAT`
			`yield from self.readSFAT()`

			`# Read properties`
			`chain = self.getChain(self["header/bb_start"].value)`
			`prop_per_sector = self.sector_size // Property.static_size`
			`self.properties = []`
			`for block in chain:`
			`self.seekBlock(block)`
			`for index in range(prop_per_sector):`
			`property = Property(self, "property[]")`
			`yield property`
			`self.properties.append(property)`

			`# Parse first property`
			`for index, property in enumerate(self.properties):`
			`if index == 0:`
			`name, parser = 'root', RootEntry`
			`else:`
			`try:`
			`name, parser = PROPERTY_NAME[property["name"].value]`
			`except LookupError:`
			`name = property.name + "content"`
			`parser = RawParser`
			`yield from self.parseProperty(property, name, parser)`

			`def parseProperty(self, property, name_prefix, parser=RawParser):`
			`if not property["size"].value:`
			`return`
			`if property["size"].value < self["header/threshold"].value and name_prefix != 'root':`
			`return`
			`name = "%s[]" % name_prefix`
			`first = None`
			`previous = None`
			`size = 0`
			`fragment_group = None`
			`chain = self.getChain(property["start"].value)`
			`while True:`
			`try:`
			`block = next(chain)`
			`contiguous = False`
			`if first is None:`
			`first = block`
			`contiguous = True`
			`if previous is not None and block == (previous + 1):`
			`contiguous = True`
			`if contiguous:`
			`previous = block`
			`size += self.sector_size`
			`continue`
			`except StopIteration:`
			`block = None`
			`if first is None:`
			`break`
			`self.seekBlock(first)`
			`desc = "Big blocks %s..%s (%s)" % (`
			`first, previous, previous - first + 1)`
			`desc += " of %s bytes" % (self.sector_size // 8)`
			`field = CustomFragment(`
			`self, name, size, parser, desc, fragment_group)`
			`if not fragment_group:`
			`fragment_group = field.group`
			`fragment_group.args["ole2"] = field.root`
			`fragment_group.args["datasize"] = property["size"].value`
			`fragment_group.args["ole2name"] = property["name"].value`
			`yield field`
			`if block is None:`
			`break`
			`first = block`
			`previous = block`
			`size = self.sector_size`

			`def getChain(self, start, use_sfat=False):`
			`if use_sfat:`
			`fat = self.ss_fat`
			`items_per_fat = self.items_per_ssfat`
			`err_prefix = "SFAT chain"`
			`else:`
			`fat = self.bb_fat`
			`items_per_fat = self.items_per_bbfat`
			`err_prefix = "BFAT chain"`
			`block = start`
			`block_set = set()`
			`previous = block`
			`while block != SECT.END_OF_CHAIN:`
			`if block in SECT.SPECIALS:`
			`raise ParserError("%s: Invalid block index (0x%08x), previous=%s" % (`
			`err_prefix, block, previous))`
			`if block in block_set:`
			`raise ParserError("%s: Found a loop (%s=>%s)" %`
			`(err_prefix, previous, block))`
			`block_set.add(block)`
			`yield block`
			`previous = block`
			`index = block // items_per_fat`
			`try:`
			`block = fat[index]["index[%u]" % block].value`
			`except LookupError:`
			`break`

			`def readBFAT(self):`
			`self.bb_fat = []`
			`start = 0`
			`count = self.items_per_bbfat`
			`for index, block in enumerate(self.array("difat/index")):`
			`block = block.value`
			`if block == SECT.UNUSED:`
			`break`

			`desc = "FAT %u/%u at block %u" % \`
			`(1 + index, self["header/bb_count"].value, block)`

			`self.seekBlock(block)`
			`field = SectFat(self, "bbfat[]", start, count, desc)`
			`yield field`
			`self.bb_fat.append(field)`

			`start += count`

			`def readSFAT(self):`
			`chain = self.getChain(self["header/sb_start"].value)`
			`start = 0`
			`self.ss_fat = []`
			`count = self.items_per_ssfat`
			`for index, block in enumerate(chain):`
			`self.seekBlock(block)`
			`field = SectFat(self, "sfat[]",`
			`start, count,`
			`"SFAT %u/%u at block %u" %`
			`(1 + index, self["header/sb_count"].value, block))`
			`yield field`
			`self.ss_fat.append(field)`
			`start += count`

			`def createContentSize(self):`
			`max_block = 0`
			`for fat in self.array("bbfat"):`
			`for entry in fat:`
			`block = entry.value`
			`if block not in SECT.SPECIALS:`
			`max_block = max(block, max_block)`
			`if max_block in SECT.SPECIALS:`
			`return None`
			`else:`
			`return HEADER_SIZE + (max_block + 1) * self.sector_size`

			`def seekBlock(self, block):`
			`self.seekBit(HEADER_SIZE + block * self.sector_size)`