freezer.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498
  1. // Copyright 2019 The go-ethereum Authors
  2. // This file is part of the go-ethereum library.
  3. //
  4. // The go-ethereum library is free software: you can redistribute it and/or modify
  5. // it under the terms of the GNU Lesser General Public License as published by
  6. // the Free Software Foundation, either version 3 of the License, or
  7. // (at your option) any later version.
  8. //
  9. // The go-ethereum library is distributed in the hope that it will be useful,
  10. // but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. // GNU Lesser General Public License for more details.
  13. //
  14. // You should have received a copy of the GNU Lesser General Public License
  15. // along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
  16. package rawdb
  17. import (
  18. "errors"
  19. "fmt"
  20. "math"
  21. "os"
  22. "path/filepath"
  23. "sync"
  24. "sync/atomic"
  25. "time"
  26. "github.com/ethereum/go-ethereum/common"
  27. "github.com/ethereum/go-ethereum/ethdb"
  28. "github.com/ethereum/go-ethereum/log"
  29. "github.com/ethereum/go-ethereum/metrics"
  30. "github.com/ethereum/go-ethereum/params"
  31. "github.com/prometheus/tsdb/fileutil"
  32. )
  33. var (
  34. // errReadOnly is returned if the freezer is opened in read only mode. All the
  35. // mutations are disallowed.
  36. errReadOnly = errors.New("read only")
  37. // errUnknownTable is returned if the user attempts to read from a table that is
  38. // not tracked by the freezer.
  39. errUnknownTable = errors.New("unknown table")
  40. // errOutOrderInsertion is returned if the user attempts to inject out-of-order
  41. // binary blobs into the freezer.
  42. errOutOrderInsertion = errors.New("the append operation is out-order")
  43. // errSymlinkDatadir is returned if the ancient directory specified by user
  44. // is a symbolic link.
  45. errSymlinkDatadir = errors.New("symbolic link datadir is not supported")
  46. )
  47. const (
  48. // freezerRecheckInterval is the frequency to check the key-value database for
  49. // chain progression that might permit new blocks to be frozen into immutable
  50. // storage.
  51. freezerRecheckInterval = time.Minute
  52. // freezerBatchLimit is the maximum number of blocks to freeze in one batch
  53. // before doing an fsync and deleting it from the key-value store.
  54. freezerBatchLimit = 30000
  55. )
  56. // freezer is an memory mapped append-only database to store immutable chain data
  57. // into flat files:
  58. //
  59. // - The append only nature ensures that disk writes are minimized.
  60. // - The memory mapping ensures we can max out system memory for caching without
  61. // reserving it for go-ethereum. This would also reduce the memory requirements
  62. // of Geth, and thus also GC overhead.
  63. type freezer struct {
  64. // WARNING: The `frozen` field is accessed atomically. On 32 bit platforms, only
  65. // 64-bit aligned fields can be atomic. The struct is guaranteed to be so aligned,
  66. // so take advantage of that (https://golang.org/pkg/sync/atomic/#pkg-note-BUG).
  67. frozen uint64 // Number of blocks already frozen
  68. threshold uint64 // Number of recent blocks not to freeze (params.FullImmutabilityThreshold apart from tests)
  69. readonly bool
  70. tables map[string]*freezerTable // Data tables for storing everything
  71. instanceLock fileutil.Releaser // File-system lock to prevent double opens
  72. trigger chan chan struct{} // Manual blocking freeze trigger, test determinism
  73. quit chan struct{}
  74. closeOnce sync.Once
  75. }
  76. // newFreezer creates a chain freezer that moves ancient chain data into
  77. // append-only flat file containers.
  78. func newFreezer(datadir string, namespace string, readonly bool) (*freezer, error) {
  79. // Create the initial freezer object
  80. var (
  81. readMeter = metrics.NewRegisteredMeter(namespace+"ancient/read", nil)
  82. writeMeter = metrics.NewRegisteredMeter(namespace+"ancient/write", nil)
  83. sizeGauge = metrics.NewRegisteredGauge(namespace+"ancient/size", nil)
  84. )
  85. // Ensure the datadir is not a symbolic link if it exists.
  86. if info, err := os.Lstat(datadir); !os.IsNotExist(err) {
  87. if info.Mode()&os.ModeSymlink != 0 {
  88. log.Warn("Symbolic link ancient database is not supported", "path", datadir)
  89. return nil, errSymlinkDatadir
  90. }
  91. }
  92. // Leveldb uses LOCK as the filelock filename. To prevent the
  93. // name collision, we use FLOCK as the lock name.
  94. lock, _, err := fileutil.Flock(filepath.Join(datadir, "FLOCK"))
  95. if err != nil {
  96. return nil, err
  97. }
  98. // Open all the supported data tables
  99. freezer := &freezer{
  100. readonly: readonly,
  101. threshold: params.FullImmutabilityThreshold,
  102. tables: make(map[string]*freezerTable),
  103. instanceLock: lock,
  104. trigger: make(chan chan struct{}),
  105. quit: make(chan struct{}),
  106. }
  107. for name, disableSnappy := range FreezerNoSnappy {
  108. table, err := newTable(datadir, name, readMeter, writeMeter, sizeGauge, disableSnappy)
  109. if err != nil {
  110. for _, table := range freezer.tables {
  111. table.Close()
  112. }
  113. lock.Release()
  114. return nil, err
  115. }
  116. freezer.tables[name] = table
  117. }
  118. if err := freezer.repair(); err != nil {
  119. for _, table := range freezer.tables {
  120. table.Close()
  121. }
  122. lock.Release()
  123. return nil, err
  124. }
  125. log.Info("Opened ancient database", "database", datadir, "readonly", readonly)
  126. return freezer, nil
  127. }
  128. // Close terminates the chain freezer, unmapping all the data files.
  129. func (f *freezer) Close() error {
  130. var errs []error
  131. f.closeOnce.Do(func() {
  132. close(f.quit)
  133. for _, table := range f.tables {
  134. if err := table.Close(); err != nil {
  135. errs = append(errs, err)
  136. }
  137. }
  138. if err := f.instanceLock.Release(); err != nil {
  139. errs = append(errs, err)
  140. }
  141. })
  142. if errs != nil {
  143. return fmt.Errorf("%v", errs)
  144. }
  145. return nil
  146. }
  147. // HasAncient returns an indicator whether the specified ancient data exists
  148. // in the freezer.
  149. func (f *freezer) HasAncient(kind string, number uint64) (bool, error) {
  150. if table := f.tables[kind]; table != nil {
  151. return table.has(number), nil
  152. }
  153. return false, nil
  154. }
  155. // Ancient retrieves an ancient binary blob from the append-only immutable files.
  156. func (f *freezer) Ancient(kind string, number uint64) ([]byte, error) {
  157. if table := f.tables[kind]; table != nil {
  158. return table.Retrieve(number)
  159. }
  160. return nil, errUnknownTable
  161. }
  162. // Ancients returns the length of the frozen items.
  163. func (f *freezer) Ancients() (uint64, error) {
  164. return atomic.LoadUint64(&f.frozen), nil
  165. }
  166. // AncientSize returns the ancient size of the specified category.
  167. func (f *freezer) AncientSize(kind string) (uint64, error) {
  168. if table := f.tables[kind]; table != nil {
  169. return table.size()
  170. }
  171. return 0, errUnknownTable
  172. }
  173. // AppendAncient injects all binary blobs belong to block at the end of the
  174. // append-only immutable table files.
  175. //
  176. // Notably, this function is lock free but kind of thread-safe. All out-of-order
  177. // injection will be rejected. But if two injections with same number happen at
  178. // the same time, we can get into the trouble.
  179. func (f *freezer) AppendAncient(number uint64, hash, header, body, receipts, td []byte) (err error) {
  180. if f.readonly {
  181. return errReadOnly
  182. }
  183. // Ensure the binary blobs we are appending is continuous with freezer.
  184. if atomic.LoadUint64(&f.frozen) != number {
  185. return errOutOrderInsertion
  186. }
  187. // Rollback all inserted data if any insertion below failed to ensure
  188. // the tables won't out of sync.
  189. defer func() {
  190. if err != nil {
  191. rerr := f.repair()
  192. if rerr != nil {
  193. log.Crit("Failed to repair freezer", "err", rerr)
  194. }
  195. log.Info("Append ancient failed", "number", number, "err", err)
  196. }
  197. }()
  198. // Inject all the components into the relevant data tables
  199. if err := f.tables[freezerHashTable].Append(f.frozen, hash[:]); err != nil {
  200. log.Error("Failed to append ancient hash", "number", f.frozen, "hash", hash, "err", err)
  201. return err
  202. }
  203. if err := f.tables[freezerHeaderTable].Append(f.frozen, header); err != nil {
  204. log.Error("Failed to append ancient header", "number", f.frozen, "hash", hash, "err", err)
  205. return err
  206. }
  207. if err := f.tables[freezerBodiesTable].Append(f.frozen, body); err != nil {
  208. log.Error("Failed to append ancient body", "number", f.frozen, "hash", hash, "err", err)
  209. return err
  210. }
  211. if err := f.tables[freezerReceiptTable].Append(f.frozen, receipts); err != nil {
  212. log.Error("Failed to append ancient receipts", "number", f.frozen, "hash", hash, "err", err)
  213. return err
  214. }
  215. if err := f.tables[freezerDifficultyTable].Append(f.frozen, td); err != nil {
  216. log.Error("Failed to append ancient difficulty", "number", f.frozen, "hash", hash, "err", err)
  217. return err
  218. }
  219. atomic.AddUint64(&f.frozen, 1) // Only modify atomically
  220. return nil
  221. }
  222. // TruncateAncients discards any recent data above the provided threshold number.
  223. func (f *freezer) TruncateAncients(items uint64) error {
  224. if f.readonly {
  225. return errReadOnly
  226. }
  227. if atomic.LoadUint64(&f.frozen) <= items {
  228. return nil
  229. }
  230. for _, table := range f.tables {
  231. if err := table.truncate(items); err != nil {
  232. return err
  233. }
  234. }
  235. atomic.StoreUint64(&f.frozen, items)
  236. return nil
  237. }
  238. // Sync flushes all data tables to disk.
  239. func (f *freezer) Sync() error {
  240. return f.SyncRetry(1, 1*time.Second)
  241. }
  242. // SyncRetry
  243. // Quorum
  244. // add retry to sync
  245. func (f *freezer) SyncRetry(retry uint8, delay time.Duration) error {
  246. var errs []error
  247. for _, table := range f.tables {
  248. if err := table.Sync(); err != nil {
  249. errs = append(errs, err)
  250. }
  251. }
  252. hasError := len(errs) > 0
  253. if hasError && retry < 5 {
  254. log.Info("sync", "retry", retry, "errors", errs)
  255. time.Sleep(delay)
  256. return f.SyncRetry(retry+1, delay*2)
  257. } else if hasError {
  258. return fmt.Errorf("%v", errs)
  259. }
  260. return nil
  261. }
  262. // End Quorum
  263. // freeze is a background thread that periodically checks the blockchain for any
  264. // import progress and moves ancient data from the fast database into the freezer.
  265. //
  266. // This functionality is deliberately broken off from block importing to avoid
  267. // incurring additional data shuffling delays on block propagation.
  268. func (f *freezer) freeze(db ethdb.KeyValueStore) {
  269. nfdb := &nofreezedb{KeyValueStore: db}
  270. var (
  271. backoff bool
  272. triggered chan struct{} // Used in tests
  273. )
  274. for {
  275. select {
  276. case <-f.quit:
  277. log.Info("Freezer shutting down")
  278. return
  279. default:
  280. }
  281. if backoff {
  282. // If we were doing a manual trigger, notify it
  283. if triggered != nil {
  284. triggered <- struct{}{}
  285. triggered = nil
  286. }
  287. select {
  288. case <-time.NewTimer(freezerRecheckInterval).C:
  289. backoff = false
  290. case triggered = <-f.trigger:
  291. backoff = false
  292. case <-f.quit:
  293. return
  294. }
  295. }
  296. // Retrieve the freezing threshold.
  297. hash := ReadHeadBlockHash(nfdb)
  298. if hash == (common.Hash{}) {
  299. log.Debug("Current full block hash unavailable") // new chain, empty database
  300. backoff = true
  301. continue
  302. }
  303. number := ReadHeaderNumber(nfdb, hash)
  304. threshold := int(atomic.LoadUint64(&f.threshold))
  305. switch {
  306. case number == nil:
  307. log.Error("Current full block number unavailable", "hash", hash)
  308. backoff = true
  309. continue
  310. case *number < uint64(params.GetImmutabilityThresholdWithDefault(threshold)):
  311. log.Debug("Current full block not old enough", "number", *number, "hash", hash, "delay", params.GetImmutabilityThresholdWithDefault(threshold))
  312. backoff = true
  313. continue
  314. case *number-uint64(params.GetImmutabilityThresholdWithDefault(threshold)) <= f.frozen:
  315. log.Debug("Ancient blocks frozen already", "number", *number, "hash", hash, "frozen", f.frozen)
  316. backoff = true
  317. continue
  318. }
  319. head := ReadHeader(nfdb, hash, *number)
  320. if head == nil {
  321. log.Error("Current full block unavailable", "number", *number, "hash", hash)
  322. backoff = true
  323. continue
  324. }
  325. // Seems we have data ready to be frozen, process in usable batches
  326. limit := *number - uint64(params.GetImmutabilityThresholdWithDefault(threshold))
  327. if limit-f.frozen > freezerBatchLimit {
  328. limit = f.frozen + freezerBatchLimit
  329. }
  330. var (
  331. start = time.Now()
  332. first = f.frozen
  333. ancients = make([]common.Hash, 0, limit-f.frozen)
  334. )
  335. for f.frozen <= limit {
  336. // Retrieves all the components of the canonical block
  337. hash := ReadCanonicalHash(nfdb, f.frozen)
  338. if hash == (common.Hash{}) {
  339. log.Error("Canonical hash missing, can't freeze", "number", f.frozen)
  340. break
  341. }
  342. header := ReadHeaderRLP(nfdb, hash, f.frozen)
  343. if len(header) == 0 {
  344. log.Error("Block header missing, can't freeze", "number", f.frozen, "hash", hash)
  345. break
  346. }
  347. body := ReadBodyRLP(nfdb, hash, f.frozen)
  348. if len(body) == 0 {
  349. log.Error("Block body missing, can't freeze", "number", f.frozen, "hash", hash)
  350. break
  351. }
  352. receipts := ReadReceiptsRLP(nfdb, hash, f.frozen)
  353. if len(receipts) == 0 {
  354. log.Error("Block receipts missing, can't freeze", "number", f.frozen, "hash", hash)
  355. break
  356. }
  357. td := ReadTdRLP(nfdb, hash, f.frozen)
  358. if len(td) == 0 {
  359. log.Error("Total difficulty missing, can't freeze", "number", f.frozen, "hash", hash)
  360. break
  361. }
  362. log.Trace("Deep froze ancient block", "number", f.frozen, "hash", hash)
  363. // Inject all the components into the relevant data tables
  364. if err := f.AppendAncient(f.frozen, hash[:], header, body, receipts, td); err != nil {
  365. break
  366. }
  367. ancients = append(ancients, hash)
  368. }
  369. // Batch of blocks have been frozen, flush them before wiping from leveldb
  370. if err := f.Sync(); err != nil {
  371. log.Crit("Failed to flush frozen tables", "err", err)
  372. }
  373. // Wipe out all data from the active database
  374. batch := db.NewBatch()
  375. for i := 0; i < len(ancients); i++ {
  376. // Always keep the genesis block in active database
  377. if first+uint64(i) != 0 {
  378. DeleteBlockWithoutNumber(batch, ancients[i], first+uint64(i))
  379. DeleteCanonicalHash(batch, first+uint64(i))
  380. }
  381. }
  382. if err := batch.Write(); err != nil {
  383. log.Crit("Failed to delete frozen canonical blocks", "err", err)
  384. }
  385. batch.Reset()
  386. // Wipe out side chains also and track dangling side chians
  387. var dangling []common.Hash
  388. for number := first; number < f.frozen; number++ {
  389. // Always keep the genesis block in active database
  390. if number != 0 {
  391. dangling = ReadAllHashes(db, number)
  392. for _, hash := range dangling {
  393. log.Trace("Deleting side chain", "number", number, "hash", hash)
  394. DeleteBlock(batch, hash, number)
  395. }
  396. }
  397. }
  398. if err := batch.Write(); err != nil {
  399. log.Crit("Failed to delete frozen side blocks", "err", err)
  400. }
  401. batch.Reset()
  402. // Step into the future and delete and dangling side chains
  403. if f.frozen > 0 {
  404. tip := f.frozen
  405. for len(dangling) > 0 {
  406. drop := make(map[common.Hash]struct{})
  407. for _, hash := range dangling {
  408. log.Debug("Dangling parent from freezer", "number", tip-1, "hash", hash)
  409. drop[hash] = struct{}{}
  410. }
  411. children := ReadAllHashes(db, tip)
  412. for i := 0; i < len(children); i++ {
  413. // Dig up the child and ensure it's dangling
  414. child := ReadHeader(nfdb, children[i], tip)
  415. if child == nil {
  416. log.Error("Missing dangling header", "number", tip, "hash", children[i])
  417. continue
  418. }
  419. if _, ok := drop[child.ParentHash]; !ok {
  420. children = append(children[:i], children[i+1:]...)
  421. i--
  422. continue
  423. }
  424. // Delete all block data associated with the child
  425. log.Debug("Deleting dangling block", "number", tip, "hash", children[i], "parent", child.ParentHash)
  426. DeleteBlock(batch, children[i], tip)
  427. }
  428. dangling = children
  429. tip++
  430. }
  431. if err := batch.Write(); err != nil {
  432. log.Crit("Failed to delete dangling side blocks", "err", err)
  433. }
  434. }
  435. // Log something friendly for the user
  436. context := []interface{}{
  437. "blocks", f.frozen - first, "elapsed", common.PrettyDuration(time.Since(start)), "number", f.frozen - 1,
  438. }
  439. if n := len(ancients); n > 0 {
  440. context = append(context, []interface{}{"hash", ancients[n-1]}...)
  441. }
  442. log.Info("Deep froze chain segment", context...)
  443. // Avoid database thrashing with tiny writes
  444. if f.frozen-first < freezerBatchLimit {
  445. backoff = true
  446. }
  447. }
  448. }
  449. // repair truncates all data tables to the same length.
  450. func (f *freezer) repair() error {
  451. min := uint64(math.MaxUint64)
  452. for _, table := range f.tables {
  453. items := atomic.LoadUint64(&table.items)
  454. if min > items {
  455. min = items
  456. }
  457. }
  458. for _, table := range f.tables {
  459. if err := table.truncate(min); err != nil {
  460. return err
  461. }
  462. }
  463. atomic.StoreUint64(&f.frozen, min)
  464. return nil
  465. }