Sergey Matveev's repositories - btrtrc.git/commitdiff
Add Builder interface for creating .torrent files.
author: nsf <no.smile.face@gmail.com>
Thu, 5 Jul 2012 16:44:54 +0000 (22:44 +0600)
committer: nsf <no.smile.face@gmail.com>
Thu, 5 Jul 2012 16:44:54 +0000 (22:44 +0600)
torrent/builder.go [new file with mode: 0644]

diff --git a/torrent/builder.go b/torrent/builder.go
new file mode 100644 (file)
index 0000000..95ed881
--- /dev/null
@@ -0,0 +1,493 @@
+package torrent
+
+import (
+       "github.com/nsf/libtorgo/bencode"
+       "path/filepath"
+       "errors"
+       "hash"
+       "crypto/sha1"
+       "time"
+       "sort"
+       "io"
+       "os"
+)
+
+type Builder struct {
+       filesmap      map[string]bool
+       files         []file
+       files_size    int64
+       name          string
+       piece_length  int64
+       pieces        []byte
+       private       bool
+       announce_list [][]string
+       creation_date time.Time
+       comment       string
+       created_by    string
+       encoding      string
+       urls          []string
+}
+
+// Adds a file to the builder queue. You may add one or more files.
+func (b *Builder) AddFile(filename string) {
+       if b.filesmap == nil {
+               b.filesmap = make(map[string]bool)
+       }
+
+       filename, err := filepath.Abs(filename)
+       if err != nil {
+               panic(err)
+       }
+       b.filesmap[filename] = true
+}
+
+// Defines a name of the future torrent file. For single file torrents it's the
+// recommended name of the contained file. For multiple files torrents it's the
+// recommended name of the directory in which all of them will be
+// stored. Calling this function is not required. In case if no name was
+// specified, the builder will try to automatically assign it. It will use the
+// name of the file if there is only one file in the queue or it will try to
+// find the rightmost common directory of all the queued files and use its name as
+// a torrent name. In case if name cannot be assigned automatically, it will use
+// "unknown" as a torrent name.
+func (b *Builder) SetName(name string) {
+       b.name = name
+}
+
+// Sets the length of a piece in the torrent file in bytes. The default is
+// 256kb.
+func (b *Builder) SetPieceLength(length int64) {
+       b.piece_length = length
+}
+
+// Sets the "private" flag. The default is false.
+func (b *Builder) SetPrivate(v bool) {
+       b.private = v
+}
+
+// Add announce group. TODO: better explanation.
+func (b *Builder) AddAnnounceGroup(group []string) {
+       b.announce_list = append(b.announce_list, group)
+}
+
+// Sets creation date. The default is time.Now() when the .Build method was
+// called.
+func (b *Builder) SetCreationDate(date time.Time) {
+       b.creation_date = date
+}
+
+// Sets the comment. The default is no comment.
+func (b *Builder) SetComment(comment string) {
+       b.comment = comment
+}
+
+// Sets the "created by" parameter. The default is "libtorgo".
+func (b *Builder) SetCreatedBy(createdby string) {
+       b.created_by = createdby
+}
+
+// Sets the "encoding" parameter. The default is "UTF-8".
+func (b *Builder) SetEncoding(encoding string) {
+       b.encoding = encoding
+}
+
+func (b *Builder) AddURL(url string) {
+       b.urls = append(b.urls, url)
+}
+
+// Status report structure for Builder.Build method.
+type BuilderStatus struct {
+       Size int64
+       Hashed int64
+}
+
+// Builds a torrent file. This function does everything in a separate goroutine
+// and uses up to 'nworkers' of goroutines to perform SHA1 hashing. Therefore it
+// will return almost immedately. It returns two channels, the first one is for
+// completion awaiting, the second one is for getting status reports. You should
+// not call any other methods while the builder is working on the torrent file.
+func (b *Builder) Build(w io.Writer, nworkers int) (<-chan error, <-chan BuilderStatus) {
+       if nworkers <= 0 {
+               nworkers = 1
+       }
+
+       completion := make(chan error)
+       status := make(chan BuilderStatus)
+
+       go func() {
+               b.set_defaults()
+               err := b.prepare_files()
+               if err != nil {
+                       completion <- err
+                       return
+               }
+
+               // prepare workers
+               workers := make([]*worker, nworkers)
+               free_workers := make(chan *worker, nworkers)
+               for i := 0; i < nworkers; i++ {
+                       workers[i] = new_worker(free_workers)
+               }
+               stop_workers := func() {
+                       for _, w := range workers {
+                               w.stop()
+                       }
+                       for _, w := range workers {
+                               w.wait_for_stop()
+                       }
+               }
+
+               // prepare files for reading
+               fr := files_reader{files: b.files}
+               npieces := b.files_size / b.piece_length + 1
+               b.pieces = make([]byte, 20 * npieces)
+               bstatus := BuilderStatus{Size: b.files_size}
+
+               // read all the pieces passing them to workers for hashing
+               var data []byte
+               for i := int64(0); i < npieces; i++ {
+                       if data == nil {
+                               data = make([]byte, b.piece_length)
+                       }
+
+                       nr, err := fr.Read(data)
+                       if err != nil {
+                               // EOF is not an eror if it was the last piece
+                               if err == io.EOF {
+                                       if i != npieces-1 {
+                                               stop_workers()
+                                               completion <- err
+                                               return
+                                       }
+                               } else {
+                                       stop_workers()
+                                       completion <- err
+                                       return
+                               }
+                       }
+
+                       // cut the data slice to the amount of actual data read
+                       data = data[:nr]
+                       w := <-free_workers
+                       data = w.queue(data, b.pieces[20*i:20*i+20])
+
+                       // update and try to send the status report
+                       if data != nil {
+                               bstatus.Hashed += int64(len(data))
+                               data = data[:cap(data)]
+
+                               select {
+                               case status <- bstatus:
+                               default:
+                               }
+                       }
+               }
+               stop_workers()
+
+               // at this point the hash was calculated and we're ready to
+               // write the torrent file
+               err = b.write_torrent(w)
+               if err != nil {
+                       completion <- err
+                       return
+               }
+               completion <- nil
+       }()
+       return completion, status
+}
+
+//----------------------------------------------------------------------------
+// worker
+//----------------------------------------------------------------------------
+
+type worker struct {
+       msgbox chan bool
+       hash hash.Hash
+
+       // request
+       sha1 []byte
+       data []byte
+}
+
+// returns existing 'data'
+func (w *worker) queue(data, sha1 []byte) []byte {
+       d := w.data
+       w.data = data
+       w.sha1 = sha1
+       w.msgbox <- false
+       return d
+}
+
+func (w *worker) stop() {
+       w.msgbox <- true
+}
+
+func (w *worker) wait_for_stop() {
+       <-w.msgbox
+}
+
+func new_worker(out chan<- *worker) *worker {
+       w := &worker{
+               msgbox: make(chan bool),
+               hash: sha1.New(),
+       }
+       go func() {
+               var sha1 [20]byte
+               for {
+                       if <-w.msgbox {
+                               w.msgbox <- true
+                               return
+                       }
+                       w.hash.Reset()
+                       w.hash.Write(w.data)
+                       w.hash.Sum(sha1[:0])
+                       copy(w.sha1, sha1[:])
+                       out <- w
+               }
+       }()
+       out <- w
+       return w
+}
+
+//----------------------------------------------------------------------------
+// files_reader
+//----------------------------------------------------------------------------
+
+type files_reader struct {
+       files []file
+       cur int
+       curfile *os.File
+       off int64
+}
+
+func (f *files_reader) Read(data []byte) (int, error) {
+       if f.cur >= len(f.files) {
+               return 0, io.EOF
+       }
+
+       if len(data) == 0 {
+               return 0, nil
+       }
+
+       read := 0
+       for len(data) > 0 {
+               file := &f.files[f.cur]
+               if f.curfile == nil {
+                       var err error
+                       f.curfile, err = os.Open(file.abspath)
+                       if err != nil {
+                               return read, err
+                       }
+               }
+
+               // we need to read up to 'len(data)' bytes from current file
+               n := int64(len(data))
+
+               // unless there is not enough data in this file
+               if file.size - f.off < n {
+                       n = file.size - f.off
+               }
+
+               // if there is no data in this file, try next one
+               if n == 0 {
+                       err := f.curfile.Close()
+                       if err != nil {
+                               return read, err
+                       }
+
+                       f.curfile = nil
+                       f.off = 0
+                       f.cur++
+                       if f.cur >= len(f.files) {
+                               return read, io.EOF
+                       }
+                       continue
+               }
+
+               // read, handle errors
+               nr, err := f.curfile.Read(data[:n])
+               read += nr
+               f.off += int64(nr)
+               if err != nil {
+                       return read, err
+               }
+
+               // ok, we've read nr bytes out of len(data), cut the data slice
+               data = data[nr:]
+       }
+
+       return read, nil
+}
+
+// splits path into components (dirs and files), works only on absolute paths
+func split_path(path string) []string {
+       var dir, file string
+       s := make([]string, 0, 5)
+
+       dir = path
+       for {
+               dir, file = filepath.Split(filepath.Clean(dir))
+               if file == "" {
+                       break
+               }
+               s = append(s, file)
+       }
+
+       // reverse the slice
+       for i, n := 0, len(s) / 2; i < n; i++ {
+               i2 := len(s) - i - 1
+               s[i], s[i2] = s[i2], s[i]
+       }
+
+       return s
+}
+
+func (b *Builder) set_defaults() {
+       if b.piece_length == 0 {
+               b.piece_length = 256*1024
+       }
+
+       if b.creation_date.IsZero() {
+               b.creation_date = time.Now()
+       }
+
+       if b.created_by == "" {
+               b.created_by = "libtorgo"
+       }
+
+       if b.encoding == "" {
+               b.encoding = "UTF-8"
+       }
+}
+
+type file struct {
+       abspath string
+       splitpath []string
+       size int64
+}
+
+type file_slice []file
+func (s file_slice) Len() int { return len(s) }
+func (s file_slice) Less(i, j int) bool { return s[i].abspath < s[j].abspath }
+func (s file_slice) Swap(i, j int) { s[i], s[j] = s[j], s[i] }
+
+// 1. Creates a sorted slice of files 'b.files' out of 'b.filesmap'.
+// 2. Searches for a common rightmost dir and strips that part from 'splitpath'
+// of each file.
+// 3. In case if the 'b.name' was empty, assigns an automatic value to it.
+// 4. Calculates the total size of all the files 'b.files_size'
+func (b *Builder) prepare_files() error {
+       if len(b.filesmap) == 0 {
+               return errors.New("no files were queued")
+       }
+
+       const non_regular = os.ModeDir | os.ModeSymlink |
+               os.ModeDevice | os.ModeNamedPipe | os.ModeSocket
+
+       // convert a map to a slice, calculate sizes and split paths
+       b.files_size = 0
+       b.files = make([]file, 0, 10)
+       for f, _ := range b.filesmap {
+               var file file
+               fi, err := os.Stat(f)
+               if err != nil {
+                       return err
+               }
+
+               if fi.Mode() & non_regular != 0 {
+                       return errors.New(f + " is not a regular file")
+               }
+
+               file.abspath = f
+               file.splitpath = split_path(f)
+               file.size = fi.Size()
+               b.files = append(b.files, file)
+
+               b.files_size += file.size
+       }
+
+       // find the rightmost common directory
+       if len(b.files) == 1 {
+               if b.name == "" {
+                       sp := b.files[0].splitpath
+                       b.name = sp[len(sp)-1]
+               }
+       } else {
+               common := b.files[0].splitpath
+               for _, f := range b.files {
+                       if len(common) > len(f.splitpath) {
+                               common = common[:len(f.splitpath)]
+                       }
+
+                       for i, n := 0, len(common); i < n; i++ {
+                               if common[i] != f.splitpath[i] {
+                                       common = common[:i]
+                                       break
+                               }
+                       }
+
+                       if len(common) == 0 {
+                               break
+                       }
+               }
+
+               if len(common) == 0 {
+                       return errors.New("no common rightmost folder was found for a set of queued files")
+               }
+
+               // found the common folder, let's strip that part from splitpath
+               // and setup the name if it wasn't provided manually
+               if b.name == "" {
+                       b.name = common[len(common)-1]
+               }
+
+               lcommon := len(common)
+               for _, f := range b.files {
+                       f.splitpath = f.splitpath[lcommon:]
+               }
+
+               // and finally sort the files
+               sort.Sort(file_slice(b.files))
+       }
+
+       b.filesmap = nil
+       return nil
+}
+
+func (b *Builder) write_torrent(w io.Writer) error {
+       var td torrent_data
+       td.Announce = b.announce_list[0][0]
+       if len(b.announce_list) != 1 || len(b.announce_list[0]) != 1 {
+               td.AnnounceList = b.announce_list
+       }
+       td.CreationDate = b.creation_date.Unix()
+       td.Comment = b.comment
+       td.CreatedBy = b.created_by
+       td.Encoding = b.encoding
+       switch {
+       case len(b.urls) == 0:
+       case len(b.urls) == 1:
+               td.URLList = b.urls[0]
+       default:
+               td.URLList = b.urls
+       }
+
+       td.Info.PieceLength = b.piece_length
+       td.Info.Pieces = b.pieces
+       td.Info.Name = b.name
+       if len(b.files) == 1 {
+               td.Info.Length = b.files[0].size
+       } else {
+               td.Info.Files = make([]torrent_info_file, len(b.files))
+               for i, f := range b.files {
+                       td.Info.Files[i] = torrent_info_file{
+                               Path: f.splitpath,
+                               Length: f.size,
+                       }
+               }
+       }
+       td.Info.Private = b.private
+
+       e := bencode.NewEncoder(w)
+       return e.Encode(&td)
+}
\ No newline at end of file