From 2b6bb12dcedc42190747064b2e0cb564c0f3c159 Mon Sep 17 00:00:00 2001
From: mokurin000 <1348292515a@gmail.com>
Date: Mon, 11 Aug 2025 13:32:54 +0800
Subject: [PATCH] enhance: enable higher compression level

---
Notes (ignored by `git am`):
  * The only change is to the final write_parquet() call, which now passes
    compression="zstd" and compression_level=15 explicitly instead of
    relying on the writer's defaults. The hashing pipeline is untouched.
  * NOTE(review): the string literal appended to user_id before hashing is
    committed in plain text in the context lines below -- confirm that is
    intended for a file that produces "_pub" output.

 utils/hash_userid.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/utils/hash_userid.py b/utils/hash_userid.py
index c9b40cc..b2cfd6c 100644
--- a/utils/hash_userid.py
+++ b/utils/hash_userid.py
@@ -8,4 +8,6 @@ pl.scan_parquet(file).with_columns(
     pl.col("user_id").cast(pl.String).add("Lt2N5xgjJOqRsT5qVt7wWYw6SqOPZDI7")
 ).with_columns(
     pl_hash.col("user_id").chash.sha2_256().str.head(16)
-).collect().write_parquet(file.replace(".parquet", "_pub.parquet"))
+).collect().write_parquet(
+    file.replace(".parquet", "_pub.parquet"), compression="zstd", compression_level=15
+)