From e341105ef2deb8b92d5bcd6e5688cb9c9449a4d9 Mon Sep 17 00:00:00 2001 From: Hagen Wierstorf Date: Tue, 25 Jun 2024 13:39:30 +0200 Subject: [PATCH] DOC: Table.save() store hash for parquet files --- audformat/core/table.py | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/audformat/core/table.py b/audformat/core/table.py index 30924953..f79aa3df 100644 --- a/audformat/core/table.py +++ b/audformat/core/table.py @@ -586,6 +586,16 @@ def save( Existing files will be overwritten. + When using ``"parquet"`` as ``storage_format``, + a hash, + based on the content of the table, + is stored under the key ``b"hash"`` + in the metadata of the schema of the parquet file. + This provides a deterministic hash, + as MD5 sums of parquet files + can differ + for the same content. + Args: path: file path without extension storage_format: storage format of table.