X-Git-Url: http://www.git.stargrave.org/?a=blobdiff_plain;f=cmd%2Fwarc-extract%2Fmain.go;h=d207273e2ee95f8d349ae3ae16607ce2bcf09c07;hb=HEAD;hp=85bc2731d930894e387ba7ae59a536a8ad4ecd77;hpb=6eee3c6c83cc535855e254426a90f7a2abba04ce;p=tofuproxy.git diff --git a/cmd/warc-extract/main.go b/cmd/warc-extract/main.go index 85bc273..c9d2a36 100644 --- a/cmd/warc-extract/main.go +++ b/cmd/warc-extract/main.go @@ -1,20 +1,17 @@ -/* -tofuproxy -- flexible HTTP proxy, TLS terminator, X.509 certificates - manager, WARC/Gemini browser -Copyright (C) 2021 Sergey Matveev - -This program is free software: you can redistribute it and/or modify -it under the terms of the GNU General Public License as published by -the Free Software Foundation, version 3 of the License. - -This program is distributed in the hope that it will be useful, -but WITHOUT ANY WARRANTY; without even the implied warranty of -MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -GNU General Public License for more details. - -You should have received a copy of the GNU General Public License -along with this program. If not, see <http://www.gnu.org/licenses/>. -*/ +// warc-extract -- WARC files data extractor +// Copyright (C) 2021-2024 Sergey Matveev +// +// This program is free software: you can redistribute it and/or modify +// it under the terms of the GNU General Public License as published by +// the Free Software Foundation, version 3 of the License. +// +// This program is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// GNU General Public License for more details. +// +// You should have received a copy of the GNU General Public License +// along with this program. If not, see <http://www.gnu.org/licenses/>. 
package main @@ -35,10 +32,12 @@ import ( func main() { uri := flag.String("uri", "", "URI to extract, if specified") hdr := flag.Bool("hdr", false, "Also extract WARC's header") - idx := flag.Bool("idx", false, "Save WARC indexes") + idx := flag.Bool("idx", false, "Save WARC indices") recompress := flag.Bool("for-enzstd", false, "Output for enzstd utility") + unzstdPath := flag.String("unzstd", "cmd/zstd/unzstd", "Path to unzstd utility") flag.Parse() log.SetFlags(log.Lshortfile) + warc.UnZSTDPath = *unzstdPath if *recompress { var hdr bytes.Buffer @@ -90,7 +89,7 @@ func main() { } log.Println("added", p, len(warc.WARCs[p]), "URIs") if *idx { - if err := warc.SaveIndexes(); err != nil { + if err := warc.SaveIndices(); err != nil { log.Fatalln(err) } } @@ -118,5 +117,4 @@ func main() { io.Copy(os.Stdout, r) } } - return }