2 files changed, 33 insertions, 64 deletions
diff --git a/qutebrowser/misc/elf.py b/qutebrowser/misc/elf.py
index aa717e790..35af5af28 100644
--- a/qutebrowser/misc/elf.py
+++ b/qutebrowser/misc/elf.py
@@ -44,21 +44,16 @@ This is a "best effort" parser. If it errors out, we instead end up relying on t
 PyQtWebEngine version, which is the next best thing.
 """
 
-import struct
 import enum
 import re
 import dataclasses
 import mmap
 import pathlib
-from typing import Any, IO, ClassVar, Dict, Optional, Tuple, cast
+from typing import IO, ClassVar, Dict, Optional, cast
 
 from qutebrowser.qt import machinery
 from qutebrowser.utils import log, version, qtutils
-
-
-class ParseError(Exception):
-
-    """Raised when the ELF file can't be parsed."""
+from qutebrowser.misc import binparsing
 
 
 class Bitness(enum.Enum):
@@ -77,33 +72,6 @@ class Endianness(enum.Enum):
     big = 2
 
 
-def _unpack(fmt: str, fobj: IO[bytes]) -> Tuple[Any, ...]:
-    """Unpack the given struct format from the given file."""
-    size = struct.calcsize(fmt)
-    data = _safe_read(fobj, size)
-
-    try:
-        return struct.unpack(fmt, data)
-    except struct.error as e:
-        raise ParseError(e)
-
-
-def _safe_read(fobj: IO[bytes], size: int) -> bytes:
-    """Read from a file, handling possible exceptions."""
-    try:
-        return fobj.read(size)
-    except (OSError, OverflowError) as e:
-        raise ParseError(e)
-
-
-def _safe_seek(fobj: IO[bytes], pos: int) -> None:
-    """Seek in a file, handling possible exceptions."""
-    try:
-        fobj.seek(pos)
-    except (OSError, OverflowError) as e:
-        raise ParseError(e)
-
-
 @dataclasses.dataclass
 class Ident:
 
@@ -125,17 +93,17 @@ class Ident:
     @classmethod
     def parse(cls, fobj: IO[bytes]) -> 'Ident':
         """Parse an ELF ident header from a file."""
-        magic, klass, data, elfversion, osabi, abiversion = _unpack(cls._FORMAT, fobj)
+        magic, klass, data, elfversion, osabi, abiversion = binparsing.unpack(cls._FORMAT, fobj)
 
         try:
             bitness = Bitness(klass)
         except ValueError:
-            raise ParseError(f"Invalid bitness {klass}")
+            raise binparsing.ParseError(f"Invalid bitness {klass}")
 
         try:
             endianness = Endianness(data)
         except ValueError:
-            raise ParseError(f"Invalid endianness {data}")
+            raise binparsing.ParseError(f"Invalid endianness {data}")
 
         return cls(magic, bitness, endianness, elfversion, osabi, abiversion)
 
@@ -172,7 +140,7 @@ class Header:
     def parse(cls, fobj: IO[bytes], bitness: Bitness) -> 'Header':
         """Parse an ELF header from a file."""
         fmt = cls._FORMATS[bitness]
-        return cls(*_unpack(fmt, fobj))
+        return cls(*binparsing.unpack(fmt, fobj))
 
 
 @dataclasses.dataclass
@@ -203,39 +171,39 @@ class SectionHeader:
     def parse(cls, fobj: IO[bytes], bitness: Bitness) -> 'SectionHeader':
         """Parse an ELF section header from a file."""
         fmt = cls._FORMATS[bitness]
-        return cls(*_unpack(fmt, fobj))
+        return cls(*binparsing.unpack(fmt, fobj))
 
 
 def get_rodata_header(f: IO[bytes]) -> SectionHeader:
     """Parse an ELF file and find the .rodata section header."""
     ident = Ident.parse(f)
     if ident.magic != b'\x7fELF':
-        raise ParseError(f"Invalid magic {ident.magic!r}")
+        raise binparsing.ParseError(f"Invalid magic {ident.magic!r}")
 
     if ident.data != Endianness.little:
-        raise ParseError("Big endian is unsupported")
+        raise binparsing.ParseError("Big endian is unsupported")
 
     if ident.version != 1:
-        raise ParseError(f"Only version 1 is supported, not {ident.version}")
+        raise binparsing.ParseError(f"Only version 1 is supported, not {ident.version}")
 
     header = Header.parse(f, bitness=ident.klass)
 
     # Read string table
-    _safe_seek(f, header.shoff + header.shstrndx * header.shentsize)
+    binparsing.safe_seek(f, header.shoff + header.shstrndx * header.shentsize)
     shstr = SectionHeader.parse(f, bitness=ident.klass)
 
-    _safe_seek(f, shstr.offset)
-    string_table = _safe_read(f, shstr.size)
+    binparsing.safe_seek(f, shstr.offset)
+    string_table = binparsing.safe_read(f, shstr.size)
 
     # Back to all sections
     for i in range(header.shnum):
-        _safe_seek(f, header.shoff + i * header.shentsize)
+        binparsing.safe_seek(f, header.shoff + i * header.shentsize)
         sh = SectionHeader.parse(f, bitness=ident.klass)
         name = string_table[sh.name:].split(b'\x00')[0]
         if name == b'.rodata':
             return sh
 
-    raise ParseError("No .rodata section found")
+    raise binparsing.ParseError("No .rodata section found")
 
 
 @dataclasses.dataclass
@@ -262,7 +230,7 @@ def _find_versions(data: bytes) -> Versions:
                 chromium=match.group(2).decode('ascii'),
             )
         except UnicodeDecodeError as e:
-            raise ParseError(e)
+            raise binparsing.ParseError(e)
 
     # Here it gets even more crazy: Sometimes, we don't have the full UA in one piece
     # in the string table somehow (?!). However, Qt 6.2 added a separate
@@ -273,20 +241,20 @@ def _find_versions(data: bytes) -> Versions:
     # We first get the partial Chromium version from the UA:
     match = re.search(pattern[:-4], data)  # without trailing literal \x00
     if match is None:
-        raise ParseError("No match in .rodata")
+        raise binparsing.ParseError("No match in .rodata")
 
     webengine_bytes = match.group(1)
     partial_chromium_bytes = match.group(2)
     if b"." not in partial_chromium_bytes or len(partial_chromium_bytes) < 6:
         # some sanity checking
-        raise ParseError("Inconclusive partial Chromium bytes")
+        raise binparsing.ParseError("Inconclusive partial Chromium bytes")
 
     # And then try to find the *full* string, stored separately, based on the
     # partial one we got above.
     pattern = br"\x00(" + re.escape(partial_chromium_bytes) + br"[0-9.]+)\x00"
     match = re.search(pattern, data)
     if match is None:
-        raise ParseError("No match in .rodata for full version")
+        raise binparsing.ParseError("No match in .rodata for full version")
 
     chromium_bytes = match.group(1)
     try:
@@ -295,7 +263,7 @@ def _find_versions(data: bytes) -> Versions:
             chromium=chromium_bytes.decode('ascii'),
         )
     except UnicodeDecodeError as e:
-        raise ParseError(e)
+        raise binparsing.ParseError(e)
 
 
 def _parse_from_file(f: IO[bytes]) -> Versions:
@@ -316,8 +284,8 @@ def _parse_from_file(f: IO[bytes]) -> Versions:
             return _find_versions(cast(bytes, mmap_data))
     except (OSError, OverflowError) as e:
         log.misc.debug(f"mmap failed ({e}), falling back to reading", exc_info=True)
-        _safe_seek(f, sh.offset)
-        data = _safe_read(f, sh.size)
+        binparsing.safe_seek(f, sh.offset)
+        data = binparsing.safe_read(f, sh.size)
         return _find_versions(data)
 
 
@@ -344,6 +312,6 @@ def parse_webenginecore() -> Optional[Versions]:
 
         log.misc.debug(f"Got versions from ELF: {versions}")
         return versions
-    except ParseError as e:
+    except binparsing.ParseError as e:
         log.misc.debug(f"Failed to parse ELF: {e}", exc_info=True)
         return None
diff --git a/qutebrowser/misc/pakjoy.py b/qutebrowser/misc/pakjoy.py
index 084ab46bd..78d02550a 100644
--- a/qutebrowser/misc/pakjoy.py
+++ b/qutebrowser/misc/pakjoy.py
@@ -36,16 +36,17 @@ from qutebrowser.utils import qtutils, standarddir, version, utils, log
 
 HANGOUTS_MARKER = b"// Extension ID: nkeimhogjdpnpccoofpliimaahmaaome"
 HANGOUTS_ID = 36197  # as found by toofar
+PAK_VERSION = 5
 
 TARGET_URL = b"https://*.google.com/*"
-REPLACEMENT_URL = b"https://*.qb.invalid/*"
+REPLACEMENT_URL = b"https://qute.invalid/*"
 assert len(TARGET_URL) == len(REPLACEMENT_URL)
 
 
 @dataclasses.dataclass
-class Pak5Header:
+class PakHeader:
 
-    """Chromium .pak header."""
+    """Chromium .pak header (version 5)."""
 
     encoding: int  # uint32
     resource_count: int  # uint16
@@ -54,7 +55,7 @@ class Pak5Header:
     _FORMAT: ClassVar[str] = '<IHH'
 
     @classmethod
-    def parse(cls, fobj: IO[bytes]) -> 'Pak5Header':
+    def parse(cls, fobj: IO[bytes]) -> 'PakHeader':
         """Parse a PAK version 5 header from a file."""
         return cls(*binparsing.unpack(cls._FORMAT, fobj))
 
@@ -82,7 +83,7 @@ class PakParser:
     def __init__(self, fobj: IO[bytes]) -> None:
         """Parse the .pak file from the given file object."""
         pak_version = binparsing.unpack("<I", fobj)[0]
-        if pak_version != 5:
+        if pak_version != PAK_VERSION:
             raise binparsing.ParseError(f"Unsupported .pak version {pak_version}")
 
         self.fobj = fobj
@@ -113,7 +114,7 @@ class PakParser:
         """Read the header and entry index from the .pak file."""
         entries = []
 
-        header = Pak5Header.parse(self.fobj)
+        header = PakHeader.parse(self.fobj)
         for _ in range(header.resource_count + 1):  # + 1 due to sentinel at end
             entries.append(PakEntry.parse(self.fobj))
 
@@ -135,9 +136,9 @@ class PakParser:
             if manifest is not None:
                 return suspected_entry, manifest
 
-        # didn't find it via the previously known ID, let's search them all...
-        for id_ in entries:
-            manifest = self._maybe_get_hangouts_manifest(entries[id_])
+        # didn't find it via the prevously known ID, let's search them all...
+        for entry in entries.values():
+            manifest = self._maybe_get_hangouts_manifest(entry)
             if manifest is not None:
                 return entries[id_], manifest