diff --git a/kloppy/io.py b/kloppy/io.py
index d2ca20e0..0726f99c 100644
--- a/kloppy/io.py
+++ b/kloppy/io.py
@@ -1,19 +1,22 @@
 """I/O utilities for reading raw data."""
+
+import bz2
 import contextlib
+import gzip
 import logging
+import lzma
 import os
 import urllib.parse
 from dataclasses import dataclass, replace
-from io import BytesIO, BufferedIOBase
-from pathlib import PurePath
+from io import BufferedWriter, BytesIO, TextIOWrapper
 from typing import (
     IO,
     BinaryIO,
+    ContextManager,
+    Generator,
+    Optional,
     Tuple,
     Union,
-    Optional,
-    Generator,
-    ContextManager,
 )
 
 from kloppy.config import get_config
@@ -22,43 +25,13 @@
 
 logger = logging.getLogger(__name__)
 
+DEFAULT_GZIP_COMPRESSION = 1
+DEFAULT_BZ2_COMPRESSION = 9
+DEFAULT_XZ_COMPRESSION = 6
 
-def _open(file: str, mode: str) -> IO:
-    if file.endswith(".gz"):
-        import gzip
-
-        return gzip.open(file, mode)
-    elif file.endswith(".xz"):
-        import lzma
-
-        return lzma.open(file, mode)
-    elif file.endswith(".bz2"):
-        import bz2
-
-        return bz2.open(file, mode)
-    return open(file, mode)
 
-
-def _decompress(stream: BinaryIO) -> BinaryIO:
-    stream.seek(0)
-    if stream.read(3) == b"\x1f\x8b\x08":
-        import gzip
-
-        stream.seek(0)
-        print("GZIP")
-        return gzip.GzipFile(fileobj=stream, mode="rb")
-    elif stream.read(6) == b"\xfd7zXZ\x00":
-        import lzma
-
-        stream.seek(0)
-        return lzma.LZMAFile(stream)
-    elif stream.read(3) == b"BZh":
-        import bz2
-
-        stream.seek(0)
-        return bz2.BZ2File(stream)
-    stream.seek(0)
-    return stream
+FilePath = Union[str, bytes, os.PathLike]
+FileOrPath = Union[FilePath, IO]
 
 
 @dataclass(frozen=True)
@@ -74,7 +47,7 @@ class Source:
         >>> open_as_file(Source.create("example.csv", optional=True))
     """
 
-    data: "FileLike"
+    data: FileOrPath
     optional: bool = False
     skip_if_missing: bool = False
 
@@ -85,14 +58,227 @@ def create(cls, input_: "FileLike", **kwargs):
         return Source(data=input_, **kwargs)
 
 
-FileLike = Union[str, PurePath, bytes, BinaryIO, Source]
+FileLike = Union[FileOrPath, Source]
+
+
+def _file_or_path_to_binary_stream(
+    file_or_path: FileOrPath, binary_mode: str
+) -> Tuple[BinaryIO, bool]:
+    """
+    Converts a file path or a file-like object to a binary stream.
+
+    Args:
+        file_or_path: The file path or file-like object to convert.
+        binary_mode: The binary mode to open the file in. Must be one of 'rb', 'wb', or 'ab'.
+
+    Returns:
+        A tuple containing the binary stream and a boolean indicating whether
+        a new file was opened (True) or an existing file-like object was used (False).
+    """
+    assert binary_mode in ("rb", "wb", "ab")
+
+    if isinstance(file_or_path, (str, bytes)) or hasattr(
+        file_or_path, "__fspath__"
+    ):
+        # If file_or_path is a path-like object, open it and return the binary stream
+        return open(os.fspath(file_or_path), binary_mode), True  # type: ignore
+
+    if isinstance(file_or_path, TextIOWrapper):
+        # If file_or_path is a TextIOWrapper, return its underlying binary buffer
+        return file_or_path.buffer, False
+
+    if hasattr(file_or_path, "readinto") or hasattr(file_or_path, "write"):
+        # If file_or_path is a file-like object, return it as is
+        return file_or_path, False  # type: ignore
+
+    raise TypeError(
+        f"Unsupported type for {file_or_path}, "
+        f"{file_or_path.__class__.__name__}."
+    )
+
+
+def _detect_format_from_content(file_or_path: FileOrPath) -> Optional[str]:
+    """
+    Attempts to detect file format from the content by reading the first
+    6 bytes. Returns None if no format could be detected.
+    """
+    fileobj, closefd = _file_or_path_to_binary_stream(file_or_path, "rb")
+    try:
+        if not fileobj.readable():
+            return None
+        if hasattr(fileobj, "peek"):
+            bs = fileobj.peek(6)
+        elif hasattr(fileobj, "seekable") and fileobj.seekable():
+            current_pos = fileobj.tell()
+            bs = fileobj.read(6)
+            fileobj.seek(current_pos)
+        else:
+            return None
+
+        if bs[:2] == b"\x1f\x8b":
+            # https://tools.ietf.org/html/rfc1952#page-6
+            return "gz"
+        elif bs[:3] == b"\x42\x5a\x68":
+            # https://en.wikipedia.org/wiki/List_of_file_signatures
+            return "bz2"
+        elif bs[:6] == b"\xfd\x37\x7a\x58\x5a\x00":
+            # https://tukaani.org/xz/xz-file-format.txt
+            return "xz"
+        return None
+    finally:
+        if closefd:
+            fileobj.close()
+
+
+def _detect_format_from_extension(filename: FilePath) -> Optional[str]:
+    """
+    Attempt to detect file format from the filename extension.
+    Return None if no format could be detected.
+    """
+    extensions = ("bz2", "xz", "gz")
+
+    if isinstance(filename, bytes):
+        for ext in extensions:
+            if filename.endswith(b"." + ext.encode()):
+                return ext
+
+    if isinstance(filename, str):
+        for ext in extensions:
+            if filename.endswith("." + ext):
+                return ext
+
+    if hasattr(filename, "name"):
+        return _detect_format_from_extension(filename.name)
+
+    return None
+
+
+def _filepath_from_path_or_filelike(file_or_path: FileOrPath) -> str:
+    try:
+        return os.fspath(file_or_path)  # type: ignore
+    except TypeError:
+        pass
 
+    if hasattr(file_or_path, "name"):
+        name = file_or_path.name
+        if isinstance(name, str):
+            return name
+        elif isinstance(name, bytes):
+            return name.decode()
 
-def get_file_extension(f: FileLike) -> str:
+    return ""
+
+
+def _open(
+    filename: FileOrPath,
+    mode: str = "rb",
+    compresslevel: Optional[int] = None,
+    format: Optional[str] = None,
+) -> BinaryIO:
+    """
+    A replacement for the "open" function that can also read and write
+    compressed files transparently. The supported compression formats are gzip,
+    bzip2 and xz. Filename can be a string, a Path or a file object.
+
+    When writing, the file format is chosen based on the file name extension:
+    - .gz uses gzip compression
+    - .bz2 uses bzip2 compression
+    - .xz uses xz/lzma compression
+    - otherwise, no compression is used
+
+    When reading, if a file name extension is available, the format is detected
+    using it, but if not, the format is detected from the contents.
+
+    mode can be: 'rb', 'ab', or 'wb'.
+
+    compresslevel is the compression level for writing to gzip, and xz.
+    This parameter is ignored for the other compression formats.
+    If set to None, a default depending on the format is used:
+    gzip: 6, xz: 6.
+
+    format overrides the autodetection of input and output formats. This can be
+    useful when compressed output needs to be written to a file without an
+    extension. Possible values are "gz", "xz", "bz2" and "raw". In case of
+    "raw", no compression is used.
+    """
+    if mode not in ("rb", "wb", "ab"):
+        raise ValueError("Mode '{}' not supported".format(mode))
+    filepath = _filepath_from_path_or_filelike(filename)
+
+    if format not in (None, "gz", "xz", "bz2", "raw"):
+        raise ValueError(
+            f"Format not supported: {format}. Choose one of: 'gz', 'xz', 'bz2'"
+        )
+
+    if format == "raw":
+        detected_format = None
+    else:
+        detected_format = format or _detect_format_from_extension(filepath)
+        if detected_format is None and "r" in mode:
+            detected_format = _detect_format_from_content(filename)
+
+    if detected_format == "gz":
+        opened_file = _open_gz(filename, mode, compresslevel)
+    elif detected_format == "xz":
+        opened_file = _open_xz(filename, mode, compresslevel)
+    elif detected_format == "bz2":
+        opened_file = _open_bz2(filename, mode, compresslevel)
+    else:
+        opened_file, _ = _file_or_path_to_binary_stream(filename, mode)
+
+    return opened_file
+
+
+def _open_bz2(
+    filename: FileOrPath,
+    mode: str,
+    compresslevel: Optional[int] = None,
+) -> BinaryIO:
+    assert mode in ("rb", "ab", "wb")
+    if compresslevel is None:
+        compresslevel = DEFAULT_BZ2_COMPRESSION
+
+    if "r" in mode:
+        return bz2.open(filename, mode)  # type: ignore
+    return BufferedWriter(bz2.open(filename, mode, compresslevel))  # type: ignore
+
+
+def _open_xz(
+    filename: FileOrPath,
+    mode: str,
+    compresslevel: Optional[int] = None,
+) -> BinaryIO:
+    assert mode in ("rb", "ab", "wb")
+    if compresslevel is None:
+        compresslevel = DEFAULT_XZ_COMPRESSION
+
+    if "r" in mode:
+        return lzma.open(filename, mode)  # type: ignore
+    return BufferedWriter(lzma.open(filename, mode, preset=compresslevel))  # type: ignore
+
+
+def _open_gz(
+    filename: FileOrPath,
+    mode: str,
+    compresslevel: Optional[int] = None,
+) -> BinaryIO:
+    assert mode in ("rb", "ab", "wb")
+    if compresslevel is None:
+        compresslevel = DEFAULT_GZIP_COMPRESSION
+
+    if "r" in mode:
+        return gzip.open(filename, mode)  # type: ignore
+    return BufferedWriter(gzip.open(filename, mode, compresslevel=compresslevel))  # type: ignore
+
+
+def get_file_extension(file_or_path: FileLike) -> str:
     """Determine the file extension of the given file-like object.
 
+    If the file has compression extensions such as '.gz', '.xz', or '.bz2',
+    they will be stripped before determining the extension.
+
     Args:
-        f (FileLike): The file-like object whose extension needs to be determined.
+        file_or_path (FileLike): The file-like object whose extension needs to be determined.
 
     Returns:
         str: The file extension, including the dot ('.') if present.
@@ -100,10 +286,6 @@ def get_file_extension(f: FileLike) -> str:
     Raises:
         Exception: If the extension cannot be determined.
 
-    Note:
-        - If the file has compression extensions such as '.gz', '.xz', or
-          '.bz2', they will be stripped before determining the extension.
-
     Example:
         >>> get_file_extension("example.xml.gz")
         '.xml'
@@ -112,26 +294,39 @@ def get_file_extension(f: FileLike) -> str:
         >>> get_file_extension(Source(data="example.csv"))
         '.csv'
     """
-    if isinstance(f, PurePath) or isinstance(f, str):
-        f = str(f)
+    if isinstance(file_or_path, (str, bytes)) or hasattr(
+        file_or_path, "__fspath__"
+    ):
+        path = os.fspath(file_or_path)  # type: ignore
         for ext in [".gz", ".xz", ".bz2"]:
-            if f.endswith(ext):
-                f = f[: -len(ext)]
-        return os.path.splitext(f)[1]
-    elif isinstance(f, Source):
-        return get_file_extension(f.data)
-    else:
-        raise Exception("Could not determine extension")
+            if path.endswith(ext):
+                path = path[: -len(ext)]
+        return os.path.splitext(path)[1]
+
+    if isinstance(file_or_path, Source):
+        return get_file_extension(file_or_path.data)
+
+    raise TypeError(
+        f"Could not determine extension for input type: {type(file_or_path)}"
+    )
 
 
 def get_local_cache_stream(
-    url: str, cache_dir: str
+    url: str, cache_dir: str, mode: str = "rb", format: Optional[str] = None
 ) -> Tuple[BinaryIO, Union[bool, str]]:
     """Get a stream to the local cache file for the given URL.
 
+    Compressed files are read transparently. The supported compression formats
+    are gzip, bzip2 and xz.
+
     Args:
         url (str): The URL to cache.
         cache_dir (str): The directory where the cache file will be stored.
+        mode (str): The mode in which to open the cache file. Must be one of
+            'rb', 'wb', or 'ab'. Defaults to 'ab'.
+        format (str): Overrides the autodetection of input and output formats.
+            Possible values are "gz", "xz", "bz2" and "raw". In case of "raw",
+            no compression is used..
 
     Returns:
         Tuple[BinaryIO, bool | str]: A tuple containing a binary stream to the
@@ -146,22 +341,23 @@ def get_local_cache_stream(
     Example:
         >>> stream, exists = get_local_cache_stream("https://example.com/data", "./cache")
     """
+    assert mode in ("rb", "wb", "ab")
+
+    # Ensure the cache directory exists
     if not os.path.exists(cache_dir):
         os.makedirs(cache_dir)
 
+    # Generate the local filename based on the URL
     filename = urllib.parse.quote_plus(url)
     local_filename = f"{cache_dir}/{filename}"
 
-    # Open the file in append+read mode
-    # this makes sure:
-    # 1. The file is created when it does not exist
-    # 2. The file is not truncated when it does exist
-    # 3. The file can be read
-    return open(local_filename, "a+b"), (
-        os.path.exists(local_filename)
-        and os.path.getsize(local_filename) > 0
-        and local_filename
+    # Ensure the file exists by opening it in append-binary mode, creating it if necessary
+    file_exists_and_non_empty = (
+        os.path.exists(local_filename) and os.path.getsize(local_filename) > 0
     )
+    file = _open(local_filename, mode, format=format)
+
+    return file, file_exists_and_non_empty
 
 
 @contextlib.contextmanager
@@ -193,6 +389,7 @@ def open_as_file(input_: FileLike) -> ContextManager[Optional[BinaryIO]]:
 
     Raises:
         InputNotFoundError: If the input file is not found.
+        TypeError: If the input type is not supported.
 
     Example:
         >>> with open_as_file("example.txt") as f:
@@ -217,40 +414,56 @@ def open_as_file(input_: FileLike) -> ContextManager[Optional[BinaryIO]]:
                 logging.info(f"Input {input_.data} not found. Skipping")
                 return dummy_context_mgr()
             raise
-    elif isinstance(input_, str) and ("{" in input_ or "<" in input_):
+
+    if isinstance(input_, str) and ("{" in input_ or "<" in input_):
+        # If input_ is a JSON or XML string, return it as a binary stream
         return BytesIO(input_.encode("utf8"))
-    elif isinstance(input_, bytes):
+
+    if isinstance(input_, bytes):
+        # If input_ is a bytes object, return it as a binary stream
         return BytesIO(input_)
-    elif isinstance(input_, str) or isinstance(input_, PurePath):
-        if isinstance(input_, PurePath):
-            input_ = str(input_)
 
-        adapter = get_adapter(input_)
+    if isinstance(input_, str) or hasattr(input_, "__fspath__"):
+        # If input_ is a path-like object, open it and return the binary stream
+        uri = _filepath_from_path_or_filelike(input_)
+
+        adapter = get_adapter(uri)
         if adapter:
             cache_dir = get_config("cache")
             assert cache_dir is None or isinstance(cache_dir, str)
             if cache_dir:
                 stream, local_cache_file = get_local_cache_stream(
-                    input_, cache_dir
+                    uri, cache_dir, "ab", format="raw"
                 )
             else:
-                stream = BytesIO()
-                local_cache_file = None
+                stream, local_cache_file = BytesIO(), None
 
             if not local_cache_file:
-                logger.info(f"Retrieving {input_}")
-                adapter.read_to_stream(input_, stream)
+                logger.info(f"Retrieving {uri}")
+                adapter.read_to_stream(uri, stream)
                 logger.info("Retrieval complete")
             else:
                 logger.info(f"Using local cached file {local_cache_file}")
-            stream = _decompress(stream)
+
+            if cache_dir:
+                stream.close()
+                stream, _ = get_local_cache_stream(uri, cache_dir, "rb")
+            else:
+                stream.seek(0)
+
         else:
-            if not os.path.exists(input_):
-                raise InputNotFoundError(f"File {input_} does not exist")
+            if not os.path.exists(uri):
+                raise InputNotFoundError(f"File {uri} does not exist")
 
-            stream = _open(input_, "rb")
+            stream = _open(uri, "rb")
         return stream
-    elif isinstance(input_, BufferedIOBase):
-        return input_
 
-    raise ValueError(f"Unsupported input type: {type(input_)}")
+    if isinstance(input_, TextIOWrapper):
+        # If file_or_path is a TextIOWrapper, return its underlying binary buffer
+        return input_.buffer
+
+    if hasattr(input_, "readinto"):
+        # If file_or_path is a file-like object, return it as is
+        return _open(input_)  # type: ignore
+
+    raise TypeError(f"Unsupported input type: {type(input_)}")