sync_test.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359
  1. // Copyright 2015 The go-ethereum Authors
  2. // This file is part of the go-ethereum library.
  3. //
  4. // The go-ethereum library is free software: you can redistribute it and/or modify
  5. // it under the terms of the GNU Lesser General Public License as published by
  6. // the Free Software Foundation, either version 3 of the License, or
  7. // (at your option) any later version.
  8. //
  9. // The go-ethereum library is distributed in the hope that it will be useful,
  10. // but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. // GNU Lesser General Public License for more details.
  13. //
  14. // You should have received a copy of the GNU Lesser General Public License
  15. // along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
  16. package trie
  17. import (
  18. "bytes"
  19. "testing"
  20. "github.com/ethereum/go-ethereum/common"
  21. "github.com/ethereum/go-ethereum/ethdb"
  22. )
  23. // makeTestTrie create a sample test trie to test node-wise reconstruction.
  24. func makeTestTrie() (*Database, *Trie, map[string][]byte) {
  25. // Create an empty trie
  26. triedb := NewDatabase(ethdb.NewMemDatabase())
  27. trie, _ := New(common.Hash{}, triedb)
  28. // Fill it with some arbitrary data
  29. content := make(map[string][]byte)
  30. for i := byte(0); i < 255; i++ {
  31. // Map the same data under multiple keys
  32. key, val := common.LeftPadBytes([]byte{1, i}, 32), []byte{i}
  33. content[string(key)] = val
  34. trie.Update(key, val)
  35. key, val = common.LeftPadBytes([]byte{2, i}, 32), []byte{i}
  36. content[string(key)] = val
  37. trie.Update(key, val)
  38. // Add some other data to inflate the trie
  39. for j := byte(3); j < 13; j++ {
  40. key, val = common.LeftPadBytes([]byte{j, i}, 32), []byte{j, i}
  41. content[string(key)] = val
  42. trie.Update(key, val)
  43. }
  44. }
  45. trie.Commit(nil)
  46. // Return the generated trie
  47. return triedb, trie, content
  48. }
  49. // checkTrieContents cross references a reconstructed trie with an expected data
  50. // content map.
  51. func checkTrieContents(t *testing.T, db *Database, root []byte, content map[string][]byte) {
  52. // Check root availability and trie contents
  53. trie, err := New(common.BytesToHash(root), db)
  54. if err != nil {
  55. t.Fatalf("failed to create trie at %x: %v", root, err)
  56. }
  57. if err := checkTrieConsistency(db, common.BytesToHash(root)); err != nil {
  58. t.Fatalf("inconsistent trie at %x: %v", root, err)
  59. }
  60. for key, val := range content {
  61. if have := trie.Get([]byte(key)); !bytes.Equal(have, val) {
  62. t.Errorf("entry %x: content mismatch: have %x, want %x", key, have, val)
  63. }
  64. }
  65. }
  66. // checkTrieConsistency checks that all nodes in a trie are indeed present.
  67. func checkTrieConsistency(db *Database, root common.Hash) error {
  68. // Create and iterate a trie rooted in a subnode
  69. trie, err := New(root, db)
  70. if err != nil {
  71. return nil // Consider a non existent state consistent
  72. }
  73. it := trie.NodeIterator(nil)
  74. for it.Next(true) {
  75. }
  76. return it.Error()
  77. }
  78. // Tests that an empty trie is not scheduled for syncing.
  79. func TestEmptySync(t *testing.T) {
  80. dbA := NewDatabase(ethdb.NewMemDatabase())
  81. dbB := NewDatabase(ethdb.NewMemDatabase())
  82. emptyA, _ := New(common.Hash{}, dbA)
  83. emptyB, _ := New(emptyRoot, dbB)
  84. for i, trie := range []*Trie{emptyA, emptyB} {
  85. if req := NewSync(trie.Hash(), ethdb.NewMemDatabase(), nil).Missing(1); len(req) != 0 {
  86. t.Errorf("test %d: content requested for empty trie: %v", i, req)
  87. }
  88. }
  89. }
  90. // Tests that given a root hash, a trie can sync iteratively on a single thread,
  91. // requesting retrieval tasks and returning all of them in one go.
  92. func TestIterativeSyncIndividual(t *testing.T) { testIterativeSync(t, 1) }
  93. func TestIterativeSyncBatched(t *testing.T) { testIterativeSync(t, 100) }
  94. func testIterativeSync(t *testing.T, batch int) {
  95. // Create a random trie to copy
  96. srcDb, srcTrie, srcData := makeTestTrie()
  97. // Create a destination trie and sync with the scheduler
  98. diskdb := ethdb.NewMemDatabase()
  99. triedb := NewDatabase(diskdb)
  100. sched := NewSync(srcTrie.Hash(), diskdb, nil)
  101. queue := append([]common.Hash{}, sched.Missing(batch)...)
  102. for len(queue) > 0 {
  103. results := make([]SyncResult, len(queue))
  104. for i, hash := range queue {
  105. data, err := srcDb.Node(hash)
  106. if err != nil {
  107. t.Fatalf("failed to retrieve node data for %x: %v", hash, err)
  108. }
  109. results[i] = SyncResult{hash, data}
  110. }
  111. if _, index, err := sched.Process(results); err != nil {
  112. t.Fatalf("failed to process result #%d: %v", index, err)
  113. }
  114. if index, err := sched.Commit(diskdb); err != nil {
  115. t.Fatalf("failed to commit data #%d: %v", index, err)
  116. }
  117. queue = append(queue[:0], sched.Missing(batch)...)
  118. }
  119. // Cross check that the two tries are in sync
  120. checkTrieContents(t, triedb, srcTrie.Root(), srcData)
  121. }
  122. // Tests that the trie scheduler can correctly reconstruct the state even if only
  123. // partial results are returned, and the others sent only later.
  124. func TestIterativeDelayedSync(t *testing.T) {
  125. // Create a random trie to copy
  126. srcDb, srcTrie, srcData := makeTestTrie()
  127. // Create a destination trie and sync with the scheduler
  128. diskdb := ethdb.NewMemDatabase()
  129. triedb := NewDatabase(diskdb)
  130. sched := NewSync(srcTrie.Hash(), diskdb, nil)
  131. queue := append([]common.Hash{}, sched.Missing(10000)...)
  132. for len(queue) > 0 {
  133. // Sync only half of the scheduled nodes
  134. results := make([]SyncResult, len(queue)/2+1)
  135. for i, hash := range queue[:len(results)] {
  136. data, err := srcDb.Node(hash)
  137. if err != nil {
  138. t.Fatalf("failed to retrieve node data for %x: %v", hash, err)
  139. }
  140. results[i] = SyncResult{hash, data}
  141. }
  142. if _, index, err := sched.Process(results); err != nil {
  143. t.Fatalf("failed to process result #%d: %v", index, err)
  144. }
  145. if index, err := sched.Commit(diskdb); err != nil {
  146. t.Fatalf("failed to commit data #%d: %v", index, err)
  147. }
  148. queue = append(queue[len(results):], sched.Missing(10000)...)
  149. }
  150. // Cross check that the two tries are in sync
  151. checkTrieContents(t, triedb, srcTrie.Root(), srcData)
  152. }
  153. // Tests that given a root hash, a trie can sync iteratively on a single thread,
  154. // requesting retrieval tasks and returning all of them in one go, however in a
  155. // random order.
  156. func TestIterativeRandomSyncIndividual(t *testing.T) { testIterativeRandomSync(t, 1) }
  157. func TestIterativeRandomSyncBatched(t *testing.T) { testIterativeRandomSync(t, 100) }
  158. func testIterativeRandomSync(t *testing.T, batch int) {
  159. // Create a random trie to copy
  160. srcDb, srcTrie, srcData := makeTestTrie()
  161. // Create a destination trie and sync with the scheduler
  162. diskdb := ethdb.NewMemDatabase()
  163. triedb := NewDatabase(diskdb)
  164. sched := NewSync(srcTrie.Hash(), diskdb, nil)
  165. queue := make(map[common.Hash]struct{})
  166. for _, hash := range sched.Missing(batch) {
  167. queue[hash] = struct{}{}
  168. }
  169. for len(queue) > 0 {
  170. // Fetch all the queued nodes in a random order
  171. results := make([]SyncResult, 0, len(queue))
  172. for hash := range queue {
  173. data, err := srcDb.Node(hash)
  174. if err != nil {
  175. t.Fatalf("failed to retrieve node data for %x: %v", hash, err)
  176. }
  177. results = append(results, SyncResult{hash, data})
  178. }
  179. // Feed the retrieved results back and queue new tasks
  180. if _, index, err := sched.Process(results); err != nil {
  181. t.Fatalf("failed to process result #%d: %v", index, err)
  182. }
  183. if index, err := sched.Commit(diskdb); err != nil {
  184. t.Fatalf("failed to commit data #%d: %v", index, err)
  185. }
  186. queue = make(map[common.Hash]struct{})
  187. for _, hash := range sched.Missing(batch) {
  188. queue[hash] = struct{}{}
  189. }
  190. }
  191. // Cross check that the two tries are in sync
  192. checkTrieContents(t, triedb, srcTrie.Root(), srcData)
  193. }
  194. // Tests that the trie scheduler can correctly reconstruct the state even if only
  195. // partial results are returned (Even those randomly), others sent only later.
  196. func TestIterativeRandomDelayedSync(t *testing.T) {
  197. // Create a random trie to copy
  198. srcDb, srcTrie, srcData := makeTestTrie()
  199. // Create a destination trie and sync with the scheduler
  200. diskdb := ethdb.NewMemDatabase()
  201. triedb := NewDatabase(diskdb)
  202. sched := NewSync(srcTrie.Hash(), diskdb, nil)
  203. queue := make(map[common.Hash]struct{})
  204. for _, hash := range sched.Missing(10000) {
  205. queue[hash] = struct{}{}
  206. }
  207. for len(queue) > 0 {
  208. // Sync only half of the scheduled nodes, even those in random order
  209. results := make([]SyncResult, 0, len(queue)/2+1)
  210. for hash := range queue {
  211. data, err := srcDb.Node(hash)
  212. if err != nil {
  213. t.Fatalf("failed to retrieve node data for %x: %v", hash, err)
  214. }
  215. results = append(results, SyncResult{hash, data})
  216. if len(results) >= cap(results) {
  217. break
  218. }
  219. }
  220. // Feed the retrieved results back and queue new tasks
  221. if _, index, err := sched.Process(results); err != nil {
  222. t.Fatalf("failed to process result #%d: %v", index, err)
  223. }
  224. if index, err := sched.Commit(diskdb); err != nil {
  225. t.Fatalf("failed to commit data #%d: %v", index, err)
  226. }
  227. for _, result := range results {
  228. delete(queue, result.Hash)
  229. }
  230. for _, hash := range sched.Missing(10000) {
  231. queue[hash] = struct{}{}
  232. }
  233. }
  234. // Cross check that the two tries are in sync
  235. checkTrieContents(t, triedb, srcTrie.Root(), srcData)
  236. }
  237. // Tests that a trie sync will not request nodes multiple times, even if they
  238. // have such references.
  239. func TestDuplicateAvoidanceSync(t *testing.T) {
  240. // Create a random trie to copy
  241. srcDb, srcTrie, srcData := makeTestTrie()
  242. // Create a destination trie and sync with the scheduler
  243. diskdb := ethdb.NewMemDatabase()
  244. triedb := NewDatabase(diskdb)
  245. sched := NewSync(srcTrie.Hash(), diskdb, nil)
  246. queue := append([]common.Hash{}, sched.Missing(0)...)
  247. requested := make(map[common.Hash]struct{})
  248. for len(queue) > 0 {
  249. results := make([]SyncResult, len(queue))
  250. for i, hash := range queue {
  251. data, err := srcDb.Node(hash)
  252. if err != nil {
  253. t.Fatalf("failed to retrieve node data for %x: %v", hash, err)
  254. }
  255. if _, ok := requested[hash]; ok {
  256. t.Errorf("hash %x already requested once", hash)
  257. }
  258. requested[hash] = struct{}{}
  259. results[i] = SyncResult{hash, data}
  260. }
  261. if _, index, err := sched.Process(results); err != nil {
  262. t.Fatalf("failed to process result #%d: %v", index, err)
  263. }
  264. if index, err := sched.Commit(diskdb); err != nil {
  265. t.Fatalf("failed to commit data #%d: %v", index, err)
  266. }
  267. queue = append(queue[:0], sched.Missing(0)...)
  268. }
  269. // Cross check that the two tries are in sync
  270. checkTrieContents(t, triedb, srcTrie.Root(), srcData)
  271. }
  272. // Tests that at any point in time during a sync, only complete sub-tries are in
  273. // the database.
  274. func TestIncompleteSync(t *testing.T) {
  275. // Create a random trie to copy
  276. srcDb, srcTrie, _ := makeTestTrie()
  277. // Create a destination trie and sync with the scheduler
  278. diskdb := ethdb.NewMemDatabase()
  279. triedb := NewDatabase(diskdb)
  280. sched := NewSync(srcTrie.Hash(), diskdb, nil)
  281. added := []common.Hash{}
  282. queue := append([]common.Hash{}, sched.Missing(1)...)
  283. for len(queue) > 0 {
  284. // Fetch a batch of trie nodes
  285. results := make([]SyncResult, len(queue))
  286. for i, hash := range queue {
  287. data, err := srcDb.Node(hash)
  288. if err != nil {
  289. t.Fatalf("failed to retrieve node data for %x: %v", hash, err)
  290. }
  291. results[i] = SyncResult{hash, data}
  292. }
  293. // Process each of the trie nodes
  294. if _, index, err := sched.Process(results); err != nil {
  295. t.Fatalf("failed to process result #%d: %v", index, err)
  296. }
  297. if index, err := sched.Commit(diskdb); err != nil {
  298. t.Fatalf("failed to commit data #%d: %v", index, err)
  299. }
  300. for _, result := range results {
  301. added = append(added, result.Hash)
  302. }
  303. // Check that all known sub-tries in the synced trie are complete
  304. for _, root := range added {
  305. if err := checkTrieConsistency(triedb, root); err != nil {
  306. t.Fatalf("trie inconsistent: %v", err)
  307. }
  308. }
  309. // Fetch the next batch to retrieve
  310. queue = append(queue[:0], sched.Missing(1)...)
  311. }
  312. // Sanity check that removing any node from the database is detected
  313. for _, node := range added[1:] {
  314. key := node.Bytes()
  315. value, _ := diskdb.Get(key)
  316. diskdb.Delete(key)
  317. if err := checkTrieConsistency(triedb, added[0]); err == nil {
  318. t.Fatalf("trie inconsistency not caught, missing: %x", key)
  319. }
  320. diskdb.Put(key, value)
  321. }
  322. }