""" .torrent metainfo file parser http://wiki.theory.org/BitTorrentSpecification#Metainfo_File_Structure Status: To statufy Author: Christophe Gisquet """ from hachoir.parser import Parser from hachoir.field import (FieldSet, ParserError, String, RawBytes) from hachoir.core.endian import LITTLE_ENDIAN from hachoir.core.tools import makePrintable, timestampUNIX, humanFilesize # Maximum number of bytes for string length MAX_STRING_LENGTH = 6 # length in 0..999999 # Maximum number of bytes for integer value MAX_INTEGER_SIZE = 21 # 21 decimal digits (or "-" sign and 20 digits) class Integer(FieldSet): # ie def createFields(self): yield String(self, "start", 1, "Integer start delimiter (i)", charset="ASCII") # Find integer end addr = self.absolute_address + self.current_size len = self.stream.searchBytesLength( b'e', False, addr, addr + (MAX_INTEGER_SIZE + 1) * 8) if len is None: raise ParserError( "Torrent: Unable to find integer end delimiter (e)!") if not len: raise ParserError("Torrent: error, empty integer!") yield String(self, "value", len, "Integer value", charset="ASCII") yield String(self, "end", 1, "Integer end delimiter") def createValue(self): """Read integer value (may raise ValueError)""" return int(self["value"].value) class TorrentString(FieldSet): # : def createFields(self): addr = self.absolute_address len = self.stream.searchBytesLength( b':', False, addr, addr + (MAX_STRING_LENGTH + 1) * 8) if len is None: raise ParserError("Torrent: unable to find string separator (':')") if not len: raise ParserError("Torrent: error: no string length!") val = String(self, "length", len, "String length") yield val try: len = int(val.value) except ValueError: len = -1 if len < 0: raise ParserError("Invalid string length (%s)" % makePrintable(val.value, "ASCII")) yield String(self, "separator", 1, "String length/value separator") if not len: self.info("Empty string: len=%i" % len) return if len < 512: yield String(self, "value", len, "String value", 
charset="ISO-8859-1") else: # Probably raw data yield RawBytes(self, "value", len, "Raw data") def createValue(self): if "value" in self: field = self["value"] if field.__class__ != RawBytes: return field.value else: return None else: return None class Dictionary(FieldSet): # de def createFields(self): yield String(self, "start", 1, "Dictionary start delimiter (d)", charset="ASCII") while self.stream.readBytes(self.absolute_address + self.current_size, 1) != b"e": yield DictionaryItem(self, "item[]") yield String(self, "end", 1, "Dictionary end delimiter") class List(FieldSet): # le def createFields(self): yield String(self, "start", 1, "List start delimiter") while self.stream.readBytes(self.absolute_address + self.current_size, 1) != b"e": yield Entry(self, "item[]") yield String(self, "end", 1, "List end delimiter") class DictionaryItem(FieldSet): def __init__(self, *args): FieldSet.__init__(self, *args) # TODO: Remove this because it's not lazy? key = self["key"] if not key.hasValue(): return key = key.value self._name = str(key).replace(" ", "_") def createDisplay(self): if not self["value"].hasValue(): return None if self._name in ("length", "piece_length"): return humanFilesize(self.value) return FieldSet.createDisplay(self) def createValue(self): if not self["value"].hasValue(): return None if self._name == "creation_date": return self.createTimestampValue() else: return self["value"].value def createFields(self): yield Entry(self, "key") yield Entry(self, "value") def createTimestampValue(self): return timestampUNIX(self["value"].value) # Map first chunk byte => type TAGS = {b'd': Dictionary, b'i': Integer, b'l': List} for index in range(0, 9 + 1): TAGS[str(index).encode('ascii')] = TorrentString # Create an entry def Entry(parent, name): addr = parent.absolute_address + parent.current_size tag = parent.stream.readBytes(addr, 1) if tag not in TAGS: raise ParserError("Torrent: Entry of type %r not handled" % tag) cls = TAGS[tag] return cls(parent, name) 
class TorrentFile(Parser):
    """Parser for torrent metainfo files, exposed as one "root" dictionary."""

    endian = LITTLE_ENDIAN
    # Leading bytes expected at offset 0 of the stream.
    MAGIC = b"d8:announce"
    PARSER_TAGS = {
        "id": "torrent",
        "category": "misc",
        "file_ext": ("torrent",),
        "min_size": 50 * 8,
        "mime": ("application/x-bittorrent",),
        "magic": ((MAGIC, 0),),
        "description": "Torrent metainfo file"
    }

    def validate(self):
        """Return True if the stream starts with MAGIC, else an error text."""
        signature = self.MAGIC
        if self.stream.readBytes(0, len(signature)) == signature:
            return True
        return "Invalid magic"

    def createFields(self):
        """Yield the single "root" dictionary, sized to the whole parser."""
        yield Dictionary(self, "root", size=self.size)