FedP2P/torrent.go

806 lines
18 KiB
Go
Raw Normal View History

package torrent
import (
"container/heap"
"expvar"
"fmt"
"io"
"log"
"math/rand"
"net"
"sort"
"sync"
2014-12-02 06:40:18 +08:00
"time"
2014-08-21 19:08:56 +08:00
"github.com/anacrolix/missinggo"
"github.com/anacrolix/missinggo/pubsub"
"github.com/bradfitz/iter"
2015-04-28 13:24:17 +08:00
"github.com/anacrolix/torrent/bencode"
"github.com/anacrolix/torrent/metainfo"
pp "github.com/anacrolix/torrent/peer_protocol"
"github.com/anacrolix/torrent/tracker"
)
2015-03-20 07:52:01 +08:00
func (t *torrent) pieceNumPendingBytes(index int) (count pp.Integer) {
2015-03-10 23:41:21 +08:00
if t.pieceComplete(index) {
return 0
}
piece := &t.Pieces[index]
pieceLength := t.pieceLength(index)
if !piece.EverHashed {
return pieceLength
}
for i, pending := range piece.PendingChunkSpecs {
if pending {
count += chunkIndexSpec(i, pieceLength, t.chunkSize).Length
}
}
return
}
// peersKey is the key type of torrent.Peers. addPeer builds it from the raw
// bytes of a peer's IP (converted to a string) together with the peer's port.
type peersKey struct {
	IPBytes string
	Port    int
}
2015-02-24 22:34:57 +08:00
// Is not aware of Client. Maintains state of torrent for with-in a Client.
type torrent struct {
stateMu sync.Mutex
closing chan struct{}
// Closed when no more network activity is desired. This includes
// announcing, and communicating with peers.
ceasingNetworking chan struct{}
InfoHash InfoHash
Pieces []piece
// Values are the piece indices that changed.
pieceStateChanges *pubsub.PubSub
chunkSize pp.Integer
// Chunks that are wanted before all others. This is for
// responsive/streaming readers that want to unblock ASAP.
urgent map[request]struct{}
// Total length of the torrent in bytes. Stored because it's not O(1) to
// get this from the info dict.
length int64
data Data
2015-04-28 13:24:17 +08:00
// The info dict. Nil if we don't have it (yet).
2015-02-26 19:17:58 +08:00
Info *metainfo.Info
// Active peer connections, running message stream loops.
Conns []*connection
// Set of addrs to which we're attempting to connect. Connections are
// half-open until all handshakes are completed.
HalfOpen map[string]struct{}
// Reserve of peers to connect to. A peer can be both here and in the
// active connections if were told about the peer after connecting with
// them. That encourages us to reconnect to peers that are well known.
Peers map[peersKey]Peer
wantPeers sync.Cond
// BEP 12 Multitracker Metadata Extension. The tracker.Client instances
2015-02-24 22:34:57 +08:00
// mirror their respective URLs from the announce-list metainfo key.
Trackers [][]tracker.Client
// Name used if the info name isn't available.
DisplayName string
// The bencoded bytes of the info dict.
MetaData []byte
// Each element corresponds to the 16KiB metadata pieces. If true, we have
// received that piece.
metadataHave []bool
// Closed when .Info is set.
gotMetainfo chan struct{}
connPiecePriorites sync.Pool
}
// expvar counters bumped by newConnPiecePriorities, one per outcome.
var (
	// Incremented when a priorities slice is taken from the pool.
	piecePrioritiesReused = expvar.NewInt("piecePrioritiesReused")
	// Incremented when a new random permutation has to be generated.
	piecePrioritiesNew = expvar.NewInt("piecePrioritiesNew")
)
func (t *torrent) newConnPiecePriorities() []int {
_ret := t.connPiecePriorites.Get()
if _ret != nil {
piecePrioritiesReused.Add(1)
return _ret.([]int)
}
piecePrioritiesNew.Add(1)
return rand.Perm(t.numPieces())
2014-06-28 17:38:31 +08:00
}
2015-03-10 23:41:21 +08:00
// pieceComplete reports whether the storage backend considers the given piece
// complete. It is false whenever no storage has been assigned.
func (t *torrent) pieceComplete(piece int) bool {
	// TODO: This is called when setting metadata, and before storage is
	// assigned, which doesn't seem right.
	if t.data == nil {
		return false
	}
	return t.data.PieceComplete(piece)
}
// numConnsUnchoked counts the active connections whose PeerChoked flag is
// not set.
func (t *torrent) numConnsUnchoked() (num int) {
	for _, conn := range t.Conns {
		if conn.PeerChoked {
			continue
		}
		num++
	}
	return num
}
// addrActive reports whether addr is already in use for this torrent, either
// as a half-open connection attempt or as the remote address of an active
// connection.
func (t *torrent) addrActive(addr string) bool {
	_, halfOpen := t.HalfOpen[addr]
	if halfOpen {
		return true
	}
	for _, conn := range t.Conns {
		if conn.remoteAddr().String() == addr {
			return true
		}
	}
	return false
}
func (t *torrent) worstConns(cl *Client) (wcs *worstConns) {
wcs = &worstConns{
c: make([]*connection, 0, len(t.Conns)),
2015-06-16 14:57:47 +08:00
t: t,
cl: cl,
}
for _, c := range t.Conns {
select {
case <-c.closing:
default:
wcs.c = append(wcs.c, c)
}
}
return
}
// ceaseNetworking closes the ceasingNetworking channel and then closes every
// connection. It holds stateMu throughout, and returns without doing anything
// if the channel was already closed.
func (t *torrent) ceaseNetworking() {
	t.stateMu.Lock()
	defer t.stateMu.Unlock()

	// Non-blocking probe: a closed channel is always ready to receive.
	select {
	case <-t.ceasingNetworking:
		return
	default:
	}

	close(t.ceasingNetworking)
	for _, conn := range t.Conns {
		conn.Close()
	}
}
// addPeer records p in the reserve of peers unless the reserve has reached
// torrentPeersHighWater or already holds a peer with the same IP and port.
// cl.openNewConns is invoked on entry, and again after a peer was actually
// added; additions are counted per peer source in peersAddedBySource.
func (t *torrent) addPeer(p Peer, cl *Client) {
	cl.openNewConns(t)
	if len(t.Peers) >= torrentPeersHighWater {
		return
	}
	key := peersKey{IPBytes: string(p.IP), Port: p.Port}
	if _, known := t.Peers[key]; known {
		return
	}
	t.Peers[key] = p
	peersAddedBySource.Add(string(p.Source), 1)
	cl.openNewConns(t)
}
func (t *torrent) invalidateMetadata() {
t.MetaData = nil
t.metadataHave = nil
2014-06-28 17:38:31 +08:00
t.Info = nil
}
2015-03-20 07:52:01 +08:00
func (t *torrent) saveMetadataPiece(index int, data []byte) {
2014-06-28 17:38:31 +08:00
if t.haveInfo() {
return
}
if index >= len(t.metadataHave) {
log.Printf("%s: ignoring metadata piece %d", t, index)
return
}
2014-06-28 17:38:31 +08:00
copy(t.MetaData[(1<<14)*index:], data)
t.metadataHave[index] = true
}
func (t *torrent) metadataPieceCount() int {
2014-06-28 17:38:31 +08:00
return (len(t.MetaData) + (1 << 14) - 1) / (1 << 14)
}
func (t *torrent) haveMetadataPiece(piece int) bool {
if t.haveInfo() {
return (1<<14)*piece < len(t.MetaData)
} else {
2014-08-25 20:15:45 +08:00
return piece < len(t.metadataHave) && t.metadataHave[piece]
}
}
2014-06-28 17:38:31 +08:00
// metadataSizeKnown reports whether the MetaData buffer has been set, which
// happens in setMetadataSize (allocation) or setMetadata (final bytes).
func (t *torrent) metadataSizeKnown() bool {
	return t.MetaData != nil
}
// metadataSize returns the length in bytes of the MetaData buffer; zero when
// it has not been set.
func (t *torrent) metadataSize() int {
	return len(t.MetaData)
}
// infoPieceHashes splits info.Pieces into consecutive 20-byte hashes, each
// returned as a string. It slices a full 20 bytes at every step, so a Pieces
// length that is not a multiple of 20 causes an out-of-range panic.
func infoPieceHashes(info *metainfo.Info) (ret []string) {
	const hashLen = 20
	for start := 0; start < len(info.Pieces); start += hashLen {
		end := start + hashLen
		ret = append(ret, string(info.Pieces[start:end]))
	}
	return ret
}
// Called when metadata for a torrent becomes available.
func (t *torrent) setMetadata(md *metainfo.Info, infoBytes []byte, eventLocker sync.Locker) (err error) {
2015-06-02 22:17:58 +08:00
err = validateInfo(md)
if err != nil {
err = fmt.Errorf("bad info: %s", err)
return
}
t.Info = md
t.length = 0
for _, f := range t.Info.UpvertedFiles() {
t.length += f.Length
}
2014-06-28 17:38:31 +08:00
t.MetaData = infoBytes
t.metadataHave = nil
hashes := infoPieceHashes(md)
t.Pieces = make([]piece, len(hashes))
for i, hash := range hashes {
piece := &t.Pieces[i]
piece.Event.L = eventLocker
piece.noPendingWrites.L = &piece.pendingWritesMutex
2015-08-03 22:29:01 +08:00
missinggo.CopyExact(piece.Hash[:], hash)
2014-06-28 17:38:31 +08:00
}
for _, conn := range t.Conns {
t.initRequestOrdering(conn)
if err := conn.setNumPieces(t.numPieces()); err != nil {
log.Printf("closing connection: %s", err)
conn.Close()
}
}
return
}
func (t *torrent) setStorage(td Data) (err error) {
if t.data != nil {
t.data.Close()
2015-02-27 09:45:55 +08:00
}
t.data = td
2014-06-28 17:38:31 +08:00
return
}
func (t *torrent) haveAllMetadataPieces() bool {
2014-06-28 17:38:31 +08:00
if t.haveInfo() {
return true
}
if t.metadataHave == nil {
return false
}
2014-06-28 17:38:31 +08:00
for _, have := range t.metadataHave {
if !have {
return false
}
}
return true
}
func (t *torrent) setMetadataSize(bytes int64, cl *Client) {
if t.haveInfo() {
// We already know the correct metadata size.
return
}
if bytes <= 0 || bytes > 10000000 { // 10MB, pulled from my ass.
log.Printf("received bad metadata size: %d", bytes)
return
}
if t.MetaData != nil && len(t.MetaData) == int(bytes) {
return
}
t.MetaData = make([]byte, bytes)
2014-06-28 17:38:31 +08:00
t.metadataHave = make([]bool, (bytes+(1<<14)-1)/(1<<14))
for _, c := range t.Conns {
cl.requestPendingMetadata(t, c)
}
}
2015-03-09 14:35:29 +08:00
// The current working name for the torrent. Either the name in the info dict,
// or a display name given such as by the dn value in a magnet link, or "".
func (t *torrent) Name() string {
if t.haveInfo() {
return t.Info.Name
}
2015-08-19 11:29:01 +08:00
return t.DisplayName
}
func (t *torrent) pieceState(index int) (ret PieceState) {
p := &t.Pieces[index]
ret.Priority = p.Priority
if t.pieceComplete(index) {
ret.Complete = true
}
if p.QueuedForHash || p.Hashing {
ret.Checking = true
}
2015-07-17 19:07:01 +08:00
if !ret.Complete && t.piecePartiallyDownloaded(index) {
ret.Partial = true
}
return
}
2014-06-28 17:38:31 +08:00
// metadataPieceSize returns the size of the given metadata piece by passing
// the current metadata length and the piece number to the package-level
// metadataPieceSize helper.
func (t *torrent) metadataPieceSize(piece int) int {
	return metadataPieceSize(len(t.MetaData), piece)
}
func (t *torrent) newMetadataExtensionMessage(c *connection, msgType int, piece int, data []byte) pp.Message {
2014-06-28 17:38:31 +08:00
d := map[string]int{
"msg_type": msgType,
"piece": piece,
}
if data != nil {
d["total_size"] = len(t.MetaData)
}
p, err := bencode.Marshal(d)
if err != nil {
panic(err)
}
return pp.Message{
Type: pp.Extended,
ExtendedID: byte(c.PeerExtensionIDs["ut_metadata"]),
ExtendedPayload: append(p, data...),
}
}
func (t *torrent) pieceStateRuns() (ret []PieceStateRun) {
rle := missinggo.NewRunLengthEncoder(func(el interface{}, count uint64) {
ret = append(ret, PieceStateRun{
PieceState: el.(PieceState),
Length: int(count),
})
})
for index := range t.Pieces {
rle.Append(t.pieceState(index), 1)
}
rle.Flush()
return
2015-01-26 17:52:59 +08:00
}
// Produces a small string representing a PieceStateRun.
func pieceStateRunStatusChars(psr PieceStateRun) (ret string) {
ret = fmt.Sprintf("%d", psr.Length)
ret += func() string {
switch psr.Priority {
case PiecePriorityNext:
return "N"
case PiecePriorityNormal:
return "."
case PiecePriorityReadahead:
return "R"
case PiecePriorityNow:
return "!"
default:
return ""
2015-01-26 17:52:59 +08:00
}
}()
if psr.Checking {
ret += "H"
}
if psr.Partial {
ret += "P"
2015-01-26 17:52:59 +08:00
}
if psr.Complete {
ret += "C"
2015-01-26 17:52:59 +08:00
}
return
}
2015-06-16 14:57:47 +08:00
func (t *torrent) writeStatus(w io.Writer, cl *Client) {
2014-07-09 22:26:58 +08:00
fmt.Fprintf(w, "Infohash: %x\n", t.InfoHash)
fmt.Fprintf(w, "Metadata length: %d\n", t.metadataSize())
2015-06-29 22:46:24 +08:00
if !t.haveInfo() {
fmt.Fprintf(w, "Metadata have: ")
for _, h := range t.metadataHave {
fmt.Fprintf(w, "%c", func() rune {
if h {
return 'H'
} else {
return '.'
}
}())
}
fmt.Fprintln(w)
}
2014-08-25 20:15:45 +08:00
fmt.Fprintf(w, "Piece length: %s\n", func() string {
if t.haveInfo() {
return fmt.Sprint(t.usualPieceSize())
2014-08-25 20:15:45 +08:00
} else {
return "?"
}
}())
if t.haveInfo() {
2015-09-25 20:05:32 +08:00
fmt.Fprintf(w, "Num Pieces: %d\n", t.numPieces())
fmt.Fprint(w, "Piece States:")
for _, psr := range t.pieceStateRuns() {
w.Write([]byte(" "))
w.Write([]byte(pieceStateRunStatusChars(psr)))
2014-09-14 01:43:11 +08:00
}
fmt.Fprintln(w)
}
fmt.Fprintf(w, "Urgent:")
for req := range t.urgent {
2015-05-15 06:41:42 +08:00
fmt.Fprintf(w, " %v", req)
}
fmt.Fprintln(w)
2014-11-21 14:07:42 +08:00
fmt.Fprintf(w, "Trackers: ")
for _, tier := range t.Trackers {
for _, tr := range tier {
fmt.Fprintf(w, "%q ", tr.String())
}
}
fmt.Fprintf(w, "\n")
fmt.Fprintf(w, "Pending peers: %d\n", len(t.Peers))
fmt.Fprintf(w, "Half open: %d\n", len(t.HalfOpen))
2014-08-22 15:33:17 +08:00
fmt.Fprintf(w, "Active peers: %d\n", len(t.Conns))
sort.Sort(&worstConns{
2015-06-16 14:57:47 +08:00
c: t.Conns,
t: t,
cl: cl,
})
2015-06-29 22:46:24 +08:00
for i, c := range t.Conns {
fmt.Fprintf(w, "%2d. ", i+1)
2015-03-12 17:06:23 +08:00
c.WriteStatus(w, t)
}
}
// String returns the torrent's name, falling back to the hex-encoded info
// hash when the name is empty.
func (t *torrent) String() string {
	if name := t.Name(); name != "" {
		return name
	}
	return fmt.Sprintf("%x", t.InfoHash)
}
func (t *torrent) haveInfo() bool {
2015-06-29 22:46:24 +08:00
return t != nil && t.Info != nil
}
// announceList returns the URLs of the torrent's tracker clients, keeping the
// tier structure of Trackers.
//
// TODO: Include URIs that weren't converted to tracker clients.
func (t *torrent) announceList() (al [][]string) {
	for _, tier := range t.Trackers {
		var urls []string
		for _, client := range tier {
			urls = append(urls, client.URL())
		}
		al = append(al, urls)
	}
	return al
}
2015-03-20 07:52:01 +08:00
// Returns a run-time generated MetaInfo that includes the info bytes and
// announce-list as currently known to the client.
func (t *torrent) MetaInfo() *metainfo.MetaInfo {
if t.MetaData == nil {
panic("info bytes not set")
}
return &metainfo.MetaInfo{
Info: metainfo.InfoEx{
2015-02-26 19:17:58 +08:00
Info: *t.Info,
Bytes: t.MetaData,
},
CreationDate: time.Now().Unix(),
Comment: "dynamic metainfo from client",
CreatedBy: "go.torrent",
AnnounceList: t.announceList(),
}
}
func (t *torrent) bytesLeft() (left int64) {
if !t.haveInfo() {
return -1
}
2015-03-10 23:39:01 +08:00
for i := 0; i < t.numPieces(); i++ {
2015-03-20 07:52:01 +08:00
left += int64(t.pieceNumPendingBytes(i))
}
return
}
// piecePartiallyDownloaded reports whether some, but not all, of the piece's
// bytes are still pending.
func (t *torrent) piecePartiallyDownloaded(index int) bool {
	pending := t.pieceNumPendingBytes(index)
	if pending == 0 {
		return false
	}
	return pending != t.pieceLength(index)
}
2015-03-08 14:28:14 +08:00
// numChunksForPiece returns the number of chunks of chunkSize bytes needed to
// cover pieceSize bytes, rounding up.
func numChunksForPiece(chunkSize int, pieceSize int) int {
	roundedUp := pieceSize + chunkSize - 1
	return roundedUp / chunkSize
}
func (t *torrent) usualPieceSize() int {
2014-06-28 17:38:31 +08:00
return int(t.Info.PieceLength)
}
func (t *torrent) lastPieceSize() int {
2015-03-20 20:52:53 +08:00
return int(t.pieceLength(t.numPieces() - 1))
}
func (t *torrent) numPieces() int {
2015-03-12 17:06:23 +08:00
return t.Info.NumPieces()
}
func (t *torrent) numPiecesCompleted() (num int) {
2015-03-10 23:41:21 +08:00
for i := range iter.N(t.Info.NumPieces()) {
if t.pieceComplete(i) {
num++
}
}
return
}
func (t *torrent) Length() int64 {
2014-08-24 01:09:02 +08:00
return t.length
}
// isClosed reports, without blocking, whether the closing channel has been
// closed.
func (t *torrent) isClosed() bool {
	select {
	case <-t.closing:
		return true
	default:
	}
	return false
}
// close shuts the torrent down: it ceases networking, closes the closing
// channel, closes the storage when it implements io.Closer, closes every
// connection, and closes the piece state change publisher. Calling it on a
// torrent that is already closed is a no-op. The returned error is always
// nil; errors from the individual Close calls are not inspected.
func (t *torrent) close() (err error) {
	if t.isClosed() {
		return nil
	}
	t.ceaseNetworking()
	close(t.closing)
	if closer, ok := t.data.(io.Closer); ok {
		closer.Close()
	}
	for _, conn := range t.Conns {
		conn.Close()
	}
	t.pieceStateChanges.Close()
	return nil
}
2014-04-16 19:13:44 +08:00
// requestOffset returns the offset of r within the torrent data, as computed
// by torrentRequestOffset from the torrent length and the usual piece size.
func (t *torrent) requestOffset(r request) int64 {
	pieceSize := int64(t.usualPieceSize())
	return torrentRequestOffset(t.Length(), pieceSize, r)
}
// Return the request that would include the given offset into the torrent
// data. Returns !ok if there is no such request.
2014-04-16 19:13:44 +08:00
func (t *torrent) offsetRequest(off int64) (req request, ok bool) {
return torrentOffsetRequest(t.Length(), t.Info.PieceLength, int64(t.chunkSize), off)
}
func (t *torrent) writeChunk(piece int, begin int64, data []byte) (err error) {
2015-06-02 22:03:43 +08:00
n, err := t.data.WriteAt(data, int64(piece)*t.Info.PieceLength+begin)
if err == nil && n != len(data) {
err = io.ErrShortWrite
}
return
}
// bitfield returns one flag per piece, set when the piece has been hashed at
// least once and has no pending chunks.
func (t *torrent) bitfield() (bf []bool) {
	for i := range t.Pieces {
		p := &t.Pieces[i]
		// TODO: Check this logic.
		have := p.EverHashed && p.numPendingChunks() == 0
		bf = append(bf, have)
	}
	return bf
}
// validOutgoingRequest reports whether r is a well-formed request for this
// torrent: the piece index exists, the request starts on a chunk boundary, is
// no longer than a chunk, stays inside its piece, and is either a full chunk
// or runs exactly to the end of the piece.
func (t *torrent) validOutgoingRequest(r request) bool {
	switch {
	case r.Index >= pp.Integer(t.Info.NumPieces()):
		return false
	case r.Begin%t.chunkSize != 0:
		return false
	case r.Length > t.chunkSize:
		return false
	}
	pieceLength := t.pieceLength(int(r.Index))
	end := r.Begin + r.Length
	if end > pieceLength {
		return false
	}
	return r.Length == t.chunkSize || end == pieceLength
}
func (t *torrent) pieceChunks(piece int) (css []chunkSpec) {
css = make([]chunkSpec, 0, (t.pieceLength(piece)+t.chunkSize-1)/t.chunkSize)
var cs chunkSpec
2015-03-20 20:52:53 +08:00
for left := t.pieceLength(piece); left != 0; left -= cs.Length {
cs.Length = left
if cs.Length > t.chunkSize {
cs.Length = t.chunkSize
}
css = append(css, cs)
cs.Begin += cs.Length
}
return
}
// pendAllChunkSpecs marks every chunk of the given piece as pending,
// allocating the pending-chunk flags (one per chunk, rounded up) if they do
// not exist yet.
func (t *torrent) pendAllChunkSpecs(pieceIndex int) {
	p := &t.Pieces[pieceIndex]
	if p.PendingChunkSpecs == nil {
		// Allocate to exact size.
		numChunks := (t.pieceLength(pieceIndex) + t.chunkSize - 1) / t.chunkSize
		p.PendingChunkSpecs = make([]bool, numChunks)
	}
	for i := range p.PendingChunkSpecs {
		p.PendingChunkSpecs[i] = true
	}
}
type Peer struct {
Id [20]byte
IP net.IP
Port int
Source peerSource
2015-03-18 15:37:26 +08:00
// Peer is known to support encryption.
SupportsEncryption bool
}
2015-03-20 20:52:53 +08:00
func (t *torrent) pieceLength(piece int) (len_ pp.Integer) {
if int(piece) == t.numPieces()-1 {
2014-08-24 01:09:02 +08:00
len_ = pp.Integer(t.Length() % t.Info.PieceLength)
}
if len_ == 0 {
2014-06-28 17:38:31 +08:00
len_ = pp.Integer(t.Info.PieceLength)
}
return
}
func (t *torrent) hashPiece(piece pp.Integer) (ps pieceSum) {
hash := pieceHash.New()
p := &t.Pieces[piece]
p.pendingWritesMutex.Lock()
for p.pendingWrites != 0 {
p.noPendingWrites.Wait()
}
p.pendingWritesMutex.Unlock()
pl := t.Info.Piece(int(piece)).Length()
n, err := t.data.WriteSectionTo(hash, int64(piece)*t.Info.PieceLength, pl)
if err != nil {
if err != io.ErrUnexpectedEOF {
log.Printf("error hashing piece with %T: %s", t.data, err)
}
return
}
if n != pl {
panic("lame")
}
2015-08-03 22:29:01 +08:00
missinggo.CopyExact(ps[:], hash.Sum(nil))
return
}
2015-02-27 09:45:55 +08:00
func (t *torrent) haveAllPieces() bool {
if !t.haveInfo() {
return false
}
2015-03-10 23:41:21 +08:00
for i := range t.Pieces {
if !t.pieceComplete(i) {
return false
}
}
return true
}
func (me *torrent) haveAnyPieces() bool {
2015-03-10 23:41:21 +08:00
for i := range me.Pieces {
if me.pieceComplete(i) {
return true
}
}
return false
}
2014-09-14 01:50:15 +08:00
func (t *torrent) havePiece(index int) bool {
2015-03-10 23:41:21 +08:00
return t.haveInfo() && t.pieceComplete(index)
2014-09-14 01:50:15 +08:00
}
func (t *torrent) haveChunk(r request) bool {
if !t.haveInfo() {
2014-09-14 01:50:15 +08:00
return false
}
2015-07-17 19:07:01 +08:00
if t.pieceComplete(int(r.Index)) {
return true
}
p := &t.Pieces[r.Index]
2015-07-17 19:07:01 +08:00
if p.PendingChunkSpecs == nil {
return false
}
return !p.pendingChunk(r.chunkSpec, t.chunkSize)
}
func chunkIndex(cs chunkSpec, chunkSize pp.Integer) int {
return int(cs.Begin / chunkSize)
2014-09-14 01:50:15 +08:00
}
// wantChunk reports whether the chunk addressed by r is wanted: its piece
// must be wanted, and the chunk must be either pending or listed as urgent.
//
// TODO: This should probably be called wantPiece.
func (t *torrent) wantChunk(r request) bool {
	if !t.wantPiece(int(r.Index)) {
		return false
	}
	pending := t.Pieces[r.Index].pendingChunk(r.chunkSpec, t.chunkSize)
	if pending {
		return true
	}
	_, urgent := t.urgent[r]
	return urgent
}
func (t *torrent) urgentChunkInPiece(piece int) bool {
2015-06-16 14:57:47 +08:00
p := pp.Integer(piece)
for req := range t.urgent {
2015-06-16 14:57:47 +08:00
if req.Index == p {
return true
}
}
return false
}
// wantPiece reports whether the piece at index is wanted. A piece is not
// wanted without info, while it is queued for or undergoing hashing, when it
// has no priority and contains no urgent chunk, or when it is already
// complete.
//
// TODO: This should be called wantPieceIndex.
func (t *torrent) wantPiece(index int) bool {
	if !t.haveInfo() {
		return false
	}
	p := &t.Pieces[index]
	if p.QueuedForHash || p.Hashing {
		return false
	}
	if p.Priority == PiecePriorityNone && !t.urgentChunkInPiece(index) {
		return false
	}
	// Put piece complete check last, since it's the slowest as it can involve
	// calling out into external data stores.
	return !t.pieceComplete(index)
}
2014-09-14 02:06:17 +08:00
func (t *torrent) connHasWantedPieces(c *connection) bool {
return c.pieceRequestOrder != nil && !c.pieceRequestOrder.Empty()
2014-09-14 02:06:17 +08:00
}
func (t *torrent) extentPieces(off, _len int64) (pieces []int) {
for i := off / int64(t.usualPieceSize()); i*int64(t.usualPieceSize()) < off+_len; i++ {
2014-09-14 02:06:17 +08:00
pieces = append(pieces, int(i))
}
return
}
// worstBadConn pops connections off a heap built from worstConns and returns
// the first one judged bad, or nil if none is. A connection is bad when it
// has delivered at least 6 unwanted chunks and more unwanted than useful
// ones, or when at least half of socketsPerTorrent (rounded up) connections
// remain on the heap and its handshake completed more than a minute ago.
func (t *torrent) worstBadConn(cl *Client) *connection {
	candidates := t.worstConns(cl)
	heap.Init(candidates)
	for candidates.Len() != 0 {
		conn := heap.Pop(candidates).(*connection)
		mostlyUnwanted := conn.UnwantedChunksReceived >= 6 &&
			conn.UnwantedChunksReceived > conn.UsefulChunksReceived
		if mostlyUnwanted {
			return conn
		}
		// Give connections 1 minute to prove themselves.
		if candidates.Len() >= (socketsPerTorrent+1)/2 &&
			time.Since(conn.completedHandshake) > time.Minute {
			return conn
		}
	}
	return nil
}
// publishPieceChange recomputes the state of the given piece, publishes the
// piece index on pieceStateChanges when that state differs from the last
// recorded one, and then records the new state on the piece.
func (t *torrent) publishPieceChange(piece int) {
	state := t.pieceState(piece)
	p := &t.Pieces[piece]
	changed := state != p.PublicPieceState
	if changed {
		t.pieceStateChanges.Publish(piece)
	}
	p.PublicPieceState = state
}