Sergey Matveev's repositories - feeder.git/blobdiff - cmd/env.rc
Compress WARCs
[feeder.git] / cmd / env.rc
index 1982a94bcf6e8588a8a655e61827843dcb932515..7c5874cfc1ec699530212e1127a17ef7d77c1101 100644 (file)
@@ -12,3 +12,12 @@ FEEDER_PARSE_JOBS=${FEEDER_PARSE_JOBS:-0}
 command -v sha512 >/dev/null && SHA512="sha512" || SHA512="sha512sum --binary"
 
 #MAILCAPS="${MAILCAPS:-$cmds/../contrib/mailcap}"
+
+_feeder_warc_compress() {
+    $HOME/work/tofuproxy/warc-extract.cmd -for-enzstd "$1" |
+    $HOME/work/tofuproxy/cmd/zstd/enzstd > "$1".zst
+    rm "$1"
+}
+
+FEEDER_WARC_COMPRESS=_feeder_warc_compress
+FEEDER_WARC_COMPRESS=: # do not compress