// Copyright 2015 The go-ethereum Authors
// This file is part of the go-ethereum library.
//
// The go-ethereum library is free software: you can redistribute it and/or modify
// it under the terms of the GNU Lesser General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// The go-ethereum library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public License
// along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.

package eth

import (
	"math/big"
	"math/rand"
	"sync/atomic"
	"time"

	"github.com/ethereum/go-ethereum/common"
	"github.com/ethereum/go-ethereum/core/rawdb"
	"github.com/ethereum/go-ethereum/core/types"
	"github.com/ethereum/go-ethereum/eth/downloader"
	"github.com/ethereum/go-ethereum/eth/protocols/eth"
	"github.com/ethereum/go-ethereum/log"
	"github.com/ethereum/go-ethereum/p2p/enode"
)

// Tunables for chain sync scheduling and for the legacy initial transaction
// exchange.
const (
	forceSyncCycle      = 10 * time.Second // Time interval to force syncs, even if few peers are available
	defaultMinSyncPeers = 5                // Amount of peers desired to start syncing

	// This is the target size for the packs of transactions sent by txsyncLoop64.
	// A pack can get larger than this if a single transaction exceeds this size.
	txsyncPackSize = 100 * 1024
)

43
type txsync struct {
44
	p   *eth.Peer
45
	txs []*types.Transaction
46 47 48
}

// syncTransactions starts sending all currently pending transactions to the given peer.
49
func (h *handler) syncTransactions(p *eth.Peer) {
50 51 52 53 54 55
	// Assemble the set of transaction to broadcast or announce to the remote
	// peer. Fun fact, this is quite an expensive operation as it needs to sort
	// the transactions if the sorting is not cached yet. However, with a random
	// order, insertions could overflow the non-executable queues and get dropped.
	//
	// TODO(karalabe): Figure out if we could get away with random order somehow
56
	var txs types.Transactions
57
	pending, _ := h.txpool.Pending()
58
	for _, batch := range pending {
59 60
		txs = append(txs, batch...)
	}
61 62 63
	if len(txs) == 0 {
		return
	}
64 65 66
	// The eth/65 protocol introduces proper transaction announcements, so instead
	// of dripping transactions across multiple peers, just send the entire list as
	// an announcement and let the remote side decide what they need (likely nothing).
67
	if p.Version() >= eth.ETH65 {
68 69 70 71 72 73 74 75
		hashes := make([]common.Hash, len(txs))
		for i, tx := range txs {
			hashes[i] = tx.Hash()
		}
		p.AsyncSendPooledTransactionHashes(hashes)
		return
	}
	// Out of luck, peer is running legacy protocols, drop the txs over
76
	select {
77 78
	case h.txsyncCh <- &txsync{p: p, txs: txs}:
	case <-h.quitSync:
79 80 81
	}
}

82
// txsyncLoop64 takes care of the initial transaction sync for each new
83 84 85
// connection. When a new peer appears, we relay all currently pending
// transactions. In order to minimise egress bandwidth usage, we send
// the transactions in small packs to one peer at a time.
86 87
func (h *handler) txsyncLoop64() {
	defer h.wg.Done()
88

89
	var (
90
		pending = make(map[enode.ID]*txsync)
91 92 93 94
		sending = false               // whether a send is active
		pack    = new(txsync)         // the pack that is being sent
		done    = make(chan error, 1) // result of the send
	)
95

96 97
	// send starts a sending a pack of transactions from the sync.
	send := func(s *txsync) {
98
		if s.p.Version() >= eth.ETH65 {
99 100
			panic("initial transaction syncer running on eth/65+")
		}
101 102 103 104
		// Fill pack with transactions up to the target size.
		size := common.StorageSize(0)
		pack.p = s.p
		pack.txs = pack.txs[:0]
105 106 107 108 109 110 111
		for i := 0; i < len(s.txs) && size < txsyncPackSize; i++ {
			pack.txs = append(pack.txs, s.txs[i])
			size += s.txs[i].Size()
		}
		// Remove the transactions that will be sent.
		s.txs = s.txs[:copy(s.txs, s.txs[len(pack.txs):])]
		if len(s.txs) == 0 {
112
			delete(pending, s.p.Peer.ID())
113
		}
114 115 116
		// Send the pack in the background.
		s.p.Log().Trace("Sending batch of transactions", "count", len(pack.txs), "bytes", size)
		sending = true
117
		go func() { done <- pack.p.SendTransactions(pack.txs) }()
118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134
	}
	// pick chooses the next pending sync.
	pick := func() *txsync {
		if len(pending) == 0 {
			return nil
		}
		n := rand.Intn(len(pending)) + 1
		for _, s := range pending {
			if n--; n == 0 {
				return s
			}
		}
		return nil
	}

	for {
		select {
135 136
		case s := <-h.txsyncCh:
			pending[s.p.Peer.ID()] = s
137 138 139 140 141 142 143
			if !sending {
				send(s)
			}
		case err := <-done:
			sending = false
			// Stop tracking peers that cause send failures.
			if err != nil {
P
Péter Szilágyi 已提交
144
				pack.p.Log().Debug("Transaction send failed", "err", err)
145
				delete(pending, pack.p.Peer.ID())
146 147 148 149 150
			}
			// Schedule the next send.
			if s := pick(); s != nil {
				send(s)
			}
151
		case <-h.quitSync:
152 153 154 155 156
			return
		}
	}
}

157 158
// chainSyncer coordinates blockchain sync components.
type chainSyncer struct {
159
	handler     *handler
160 161 162 163 164 165 166 167 168
	force       *time.Timer
	forced      bool // true when force timer fired
	peerEventCh chan struct{}
	doneCh      chan error // non-nil when sync is running
}

// chainSyncOp is a scheduled sync operation.
type chainSyncOp struct {
	mode downloader.SyncMode
169
	peer *eth.Peer
170 171 172 173 174
	td   *big.Int
	head common.Hash
}

// newChainSyncer creates a chainSyncer.
175
func newChainSyncer(handler *handler) *chainSyncer {
176
	return &chainSyncer{
177
		handler:     handler,
178 179 180 181 182 183 184
		peerEventCh: make(chan struct{}),
	}
}

// handlePeerEvent notifies the syncer about a change in the peer set.
// This is called for new peers and every time a peer announces a new
// chain head.
185
func (cs *chainSyncer) handlePeerEvent(peer *eth.Peer) bool {
186 187 188
	select {
	case cs.peerEventCh <- struct{}{}:
		return true
189
	case <-cs.handler.quitSync:
190 191 192 193 194 195
		return false
	}
}

// loop runs in its own goroutine and launches the sync when necessary.
func (cs *chainSyncer) loop() {
196
	defer cs.handler.wg.Done()
197

198 199 200 201 202
	cs.handler.blockFetcher.Start()
	cs.handler.txFetcher.Start()
	defer cs.handler.blockFetcher.Stop()
	defer cs.handler.txFetcher.Stop()
	defer cs.handler.downloader.Terminate()
O
obscuren 已提交
203

204 205 206 207
	// The force timer lowers the peer count threshold down to one when it fires.
	// This ensures we'll always start sync even if there aren't enough peers.
	cs.force = time.NewTimer(forceSyncCycle)
	defer cs.force.Stop()
E
Egon Elbre 已提交
208

209
	for {
210 211 212 213 214 215 216 217 218 219 220 221
		if op := cs.nextSyncOp(); op != nil {
			cs.startSync(op)
		}
		select {
		case <-cs.peerEventCh:
			// Peer information changed, recheck.
		case <-cs.doneCh:
			cs.doneCh = nil
			cs.force.Reset(forceSyncCycle)
			cs.forced = false
		case <-cs.force.C:
			cs.forced = true
222

223
		case <-cs.handler.quitSync:
224 225 226
			// Disable all insertion on the blockchain. This needs to happen before
			// terminating the downloader because the downloader waits for blockchain
			// inserts, and these can take a long time to finish.
227 228
			cs.handler.chain.StopInsert()
			cs.handler.downloader.Terminate()
229 230 231
			if cs.doneCh != nil {
				<-cs.doneCh
			}
O
obscuren 已提交
232
			return
233 234 235 236
		}
	}
}

237 238 239 240
// nextSyncOp determines whether sync is required at this time.
func (cs *chainSyncer) nextSyncOp() *chainSyncOp {
	if cs.doneCh != nil {
		return nil // Sync already running.
241
	}
242

243
	// Ensure we're at minimum peer count.
244 245 246
	minPeers := defaultMinSyncPeers
	if cs.forced {
		minPeers = 1
247 248
	} else if minPeers > cs.handler.maxPeers {
		minPeers = cs.handler.maxPeers
249
	}
250
	if cs.handler.peers.Len() < minPeers {
251
		return nil
252
	}
253 254
	// We have enough peers, check TD
	peer := cs.handler.peers.ethPeerWithHighestTD()
255 256
	if peer == nil {
		return nil
257
	}
258
	mode, ourTD := cs.modeAndLocalHead()
259 260 261 262
	if mode == downloader.FastSync && atomic.LoadUint32(&cs.handler.snapSync) == 1 {
		// Fast sync via the snap protocol
		mode = downloader.SnapSync
	}
263 264 265 266 267 268 269
	op := peerToSyncOp(mode, peer)
	if op.td.Cmp(ourTD) <= 0 {
		return nil // We're in sync.
	}
	return op
}

270
func peerToSyncOp(mode downloader.SyncMode, p *eth.Peer) *chainSyncOp {
271 272 273 274 275
	peerHead, peerTD := p.Head()
	return &chainSyncOp{mode: mode, peer: p, td: peerTD, head: peerHead}
}

func (cs *chainSyncer) modeAndLocalHead() (downloader.SyncMode, *big.Int) {
276
	// If we're in fast sync mode, return that directly
277 278 279
	if atomic.LoadUint32(&cs.handler.fastSync) == 1 {
		block := cs.handler.chain.CurrentFastBlock()
		td := cs.handler.chain.GetTdByHash(block.Hash())
280 281
		return downloader.FastSync, td
	}
282 283
	// We are probably in full sync, but we might have rewound to before the
	// fast sync pivot, check if we should reenable
284 285 286 287
	if pivot := rawdb.ReadLastPivotNumber(cs.handler.database); pivot != nil {
		if head := cs.handler.chain.CurrentBlock(); head.NumberU64() < *pivot {
			block := cs.handler.chain.CurrentFastBlock()
			td := cs.handler.chain.GetTdByHash(block.Hash())
288 289 290 291
			return downloader.FastSync, td
		}
	}
	// Nope, we're really full syncing
292 293
	head := cs.handler.chain.CurrentHeader()
	td := cs.handler.chain.GetTd(head.Hash(), head.Number.Uint64())
294
	return downloader.FullSync, td
295 296 297 298 299
}

// startSync launches doSync in a new goroutine.
func (cs *chainSyncer) startSync(op *chainSyncOp) {
	cs.doneCh = make(chan error, 1)
300
	go func() { cs.doneCh <- cs.handler.doSync(op) }()
301 302 303
}

// doSync synchronizes the local blockchain with a remote peer.
304 305
func (h *handler) doSync(op *chainSyncOp) error {
	if op.mode == downloader.FastSync || op.mode == downloader.SnapSync {
306 307 308 309 310 311 312 313 314
		// Before launch the fast sync, we have to ensure user uses the same
		// txlookup limit.
		// The main concern here is: during the fast sync Geth won't index the
		// block(generate tx indices) before the HEAD-limit. But if user changes
		// the limit in the next fast sync(e.g. user kill Geth manually and
		// restart) then it will be hard for Geth to figure out the oldest block
		// has been indexed. So here for the user-experience wise, it's non-optimal
		// that user can't change limit during the fast sync. If changed, Geth
		// will just blindly use the original one.
315 316 317
		limit := h.chain.TxLookupLimit()
		if stored := rawdb.ReadFastTxLookupLimit(h.database); stored == nil {
			rawdb.WriteFastTxLookupLimit(h.database, limit)
318
		} else if *stored != limit {
319
			h.chain.SetTxLookupLimit(*stored)
320 321 322
			log.Warn("Update txLookup limit", "provided", limit, "updated", *stored)
		}
	}
323
	// Run the sync cycle, and disable fast sync if we're past the pivot block
324
	err := h.downloader.Synchronise(op.peer.ID(), op.head, op.td, op.mode)
325 326
	if err != nil {
		return err
327
	}
328
	if atomic.LoadUint32(&h.fastSync) == 1 {
329
		log.Info("Fast sync complete, auto disabling")
330
		atomic.StoreUint32(&h.fastSync, 0)
331
	}
332 333 334 335
	if atomic.LoadUint32(&h.snapSync) == 1 {
		log.Info("Snap sync complete, auto disabling")
		atomic.StoreUint32(&h.snapSync, 0)
	}
336 337
	// If we've successfully finished a sync cycle and passed any required checkpoint,
	// enable accepting transactions from the network.
338 339
	head := h.chain.CurrentBlock()
	if head.NumberU64() >= h.checkpointNumber {
340 341 342
		// Checkpoint passed, sanity check the timestamp to have a fallback mechanism
		// for non-checkpointed (number = 0) private networks.
		if head.Time() >= uint64(time.Now().AddDate(0, -1, 0).Unix()) {
343
			atomic.StoreUint32(&h.acceptTxs, 1)
344 345 346
		}
	}
	if head.NumberU64() > 0 {
347 348 349 350 351 352
		// We've completed a sync cycle, notify all peers of new state. This path is
		// essential in star-topology networks where a gateway node needs to notify
		// all its out-of-date peers of the availability of a new block. This failure
		// scenario will most often crop up in private and hackathon networks with
		// degenerate connectivity, but it should be healthy for the mainnet too to
		// more reliably update peers or the local TD state.
353
		h.BroadcastBlock(head, false)
354
	}
355
	return nil
356
}