freezer.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496
  1. // Copyright 2019 The go-ethereum Authors
  2. // This file is part of the go-ethereum library.
  3. //
  4. // The go-ethereum library is free software: you can redistribute it and/or modify
  5. // it under the terms of the GNU Lesser General Public License as published by
  6. // the Free Software Foundation, either version 3 of the License, or
  7. // (at your option) any later version.
  8. //
  9. // The go-ethereum library is distributed in the hope that it will be useful,
  10. // but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. // GNU Lesser General Public License for more details.
  13. //
  14. // You should have received a copy of the GNU Lesser General Public License
  15. // along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
  16. package rawdb
  17. import (
  18. "errors"
  19. "fmt"
  20. "math"
  21. "os"
  22. "path/filepath"
  23. "sync"
  24. "sync/atomic"
  25. "time"
  26. "github.com/ethereum/go-ethereum/common"
  27. "github.com/ethereum/go-ethereum/ethdb"
  28. "github.com/ethereum/go-ethereum/log"
  29. "github.com/ethereum/go-ethereum/metrics"
  30. "github.com/ethereum/go-ethereum/params"
  31. "github.com/prometheus/tsdb/fileutil"
  32. )
  33. var (
  34. // errReadOnly is returned if the freezer is opened in read only mode. All the
  35. // mutations are disallowed.
  36. errReadOnly = errors.New("read only")
  37. // errUnknownTable is returned if the user attempts to read from a table that is
  38. // not tracked by the freezer.
  39. errUnknownTable = errors.New("unknown table")
  40. // errOutOrderInsertion is returned if the user attempts to inject out-of-order
  41. // binary blobs into the freezer.
  42. errOutOrderInsertion = errors.New("the append operation is out-order")
  43. // errSymlinkDatadir is returned if the ancient directory specified by user
  44. // is a symbolic link.
  45. errSymlinkDatadir = errors.New("symbolic link datadir is not supported")
  46. )
  47. const (
  48. // freezerRecheckInterval is the frequency to check the key-value database for
  49. // chain progression that might permit new blocks to be frozen into immutable
  50. // storage.
  51. freezerRecheckInterval = time.Minute
  52. // freezerBatchLimit is the maximum number of blocks to freeze in one batch
  53. // before doing an fsync and deleting it from the key-value store.
  54. freezerBatchLimit = 30000
  55. )
  56. // freezer is an memory mapped append-only database to store immutable chain data
  57. // into flat files:
  58. //
  59. // - The append only nature ensures that disk writes are minimized.
  60. // - The memory mapping ensures we can max out system memory for caching without
  61. // reserving it for go-ethereum. This would also reduce the memory requirements
  62. // of Geth, and thus also GC overhead.
  63. type freezer struct {
  64. // WARNING: The `frozen` field is accessed atomically. On 32 bit platforms, only
  65. // 64-bit aligned fields can be atomic. The struct is guaranteed to be so aligned,
  66. // so take advantage of that (https://golang.org/pkg/sync/atomic/#pkg-note-BUG).
  67. frozen uint64 // Number of blocks already frozen
  68. threshold uint64 // Number of recent blocks not to freeze (params.FullImmutabilityThreshold apart from tests)
  69. readonly bool
  70. tables map[string]*freezerTable // Data tables for storing everything
  71. instanceLock fileutil.Releaser // File-system lock to prevent double opens
  72. trigger chan chan struct{} // Manual blocking freeze trigger, test determinism
  73. quit chan struct{}
  74. closeOnce sync.Once
  75. offset uint64 // Starting BlockNumber in current freezer
  76. }
  77. // newFreezer creates a chain freezer that moves ancient chain data into
  78. // append-only flat file containers.
  79. func newFreezer(datadir string, namespace string, readonly bool) (*freezer, error) {
  80. // Create the initial freezer object
  81. var (
  82. readMeter = metrics.NewRegisteredMeter(namespace+"ancient/read", nil)
  83. writeMeter = metrics.NewRegisteredMeter(namespace+"ancient/write", nil)
  84. sizeGauge = metrics.NewRegisteredGauge(namespace+"ancient/size", nil)
  85. )
  86. // Ensure the datadir is not a symbolic link if it exists.
  87. if info, err := os.Lstat(datadir); !os.IsNotExist(err) {
  88. if info.Mode()&os.ModeSymlink != 0 {
  89. log.Warn("Symbolic link ancient database is not supported", "path", datadir)
  90. return nil, errSymlinkDatadir
  91. }
  92. }
  93. // Leveldb uses LOCK as the filelock filename. To prevent the
  94. // name collision, we use FLOCK as the lock name.
  95. lock, _, err := fileutil.Flock(filepath.Join(datadir, "FLOCK"))
  96. if err != nil {
  97. return nil, err
  98. }
  99. // Open all the supported data tables
  100. freezer := &freezer{
  101. readonly: readonly,
  102. threshold: params.FullImmutabilityThreshold,
  103. tables: make(map[string]*freezerTable),
  104. instanceLock: lock,
  105. trigger: make(chan chan struct{}),
  106. quit: make(chan struct{}),
  107. }
  108. for name, disableSnappy := range FreezerNoSnappy {
  109. table, err := newTable(datadir, name, readMeter, writeMeter, sizeGauge, disableSnappy)
  110. if err != nil {
  111. for _, table := range freezer.tables {
  112. table.Close()
  113. }
  114. lock.Release()
  115. return nil, err
  116. }
  117. freezer.tables[name] = table
  118. }
  119. if err := freezer.repair(); err != nil {
  120. for _, table := range freezer.tables {
  121. table.Close()
  122. }
  123. lock.Release()
  124. return nil, err
  125. }
  126. log.Info("Opened ancient database", "database", datadir, "readonly", readonly)
  127. return freezer, nil
  128. }
  129. // Close terminates the chain freezer, unmapping all the data files.
  130. func (f *freezer) Close() error {
  131. var errs []error
  132. f.closeOnce.Do(func() {
  133. close(f.quit)
  134. for _, table := range f.tables {
  135. if err := table.Close(); err != nil {
  136. errs = append(errs, err)
  137. }
  138. }
  139. if err := f.instanceLock.Release(); err != nil {
  140. errs = append(errs, err)
  141. }
  142. })
  143. if errs != nil {
  144. return fmt.Errorf("%v", errs)
  145. }
  146. return nil
  147. }
  148. // HasAncient returns an indicator whether the specified ancient data exists
  149. // in the freezer.
  150. func (f *freezer) HasAncient(kind string, number uint64) (bool, error) {
  151. if table := f.tables[kind]; table != nil {
  152. return table.has(number - f.offset), nil
  153. }
  154. return false, nil
  155. }
  156. // Ancient retrieves an ancient binary blob from the append-only immutable files.
  157. func (f *freezer) Ancient(kind string, number uint64) ([]byte, error) {
  158. if table := f.tables[kind]; table != nil {
  159. return table.Retrieve(number - f.offset)
  160. }
  161. return nil, errUnknownTable
  162. }
  163. // Ancients returns the length of the frozen items.
  164. func (f *freezer) Ancients() (uint64, error) {
  165. return atomic.LoadUint64(&f.frozen), nil
  166. }
  167. // ItemAmountInAncient returns the actual length of current ancientDB.
  168. func (f *freezer) ItemAmountInAncient() (uint64, error) {
  169. return atomic.LoadUint64(&f.frozen) - atomic.LoadUint64(&f.offset), nil
  170. }
  171. // AncientOffSet returns the offset of current ancientDB.
  172. func (f *freezer) AncientOffSet() uint64 {
  173. return atomic.LoadUint64(&f.offset)
  174. }
  175. // AncientSize returns the ancient size of the specified category.
  176. func (f *freezer) AncientSize(kind string) (uint64, error) {
  177. if table := f.tables[kind]; table != nil {
  178. return table.size()
  179. }
  180. return 0, errUnknownTable
  181. }
  182. // AppendAncient injects all binary blobs belong to block at the end of the
  183. // append-only immutable table files.
  184. //
  185. // Notably, this function is lock free but kind of thread-safe. All out-of-order
  186. // injection will be rejected. But if two injections with same number happen at
  187. // the same time, we can get into the trouble.
  188. func (f *freezer) AppendAncient(number uint64, hash, header, body, receipts, td []byte) (err error) {
  189. if f.readonly {
  190. return errReadOnly
  191. }
  192. // Ensure the binary blobs we are appending is continuous with freezer.
  193. if atomic.LoadUint64(&f.frozen) != number {
  194. return errOutOrderInsertion
  195. }
  196. // Rollback all inserted data if any insertion below failed to ensure
  197. // the tables won't out of sync.
  198. defer func() {
  199. if err != nil {
  200. rerr := f.repair()
  201. if rerr != nil {
  202. log.Crit("Failed to repair freezer", "err", rerr)
  203. }
  204. log.Info("Append ancient failed", "number", number, "err", err)
  205. }
  206. }()
  207. // Inject all the components into the relevant data tables
  208. if err := f.tables[freezerHashTable].Append(f.frozen-f.offset, hash[:]); err != nil {
  209. log.Error("Failed to append ancient hash", "number", f.frozen, "hash", hash, "err", err)
  210. return err
  211. }
  212. if err := f.tables[freezerHeaderTable].Append(f.frozen-f.offset, header); err != nil {
  213. log.Error("Failed to append ancient header", "number", f.frozen, "hash", hash, "err", err)
  214. return err
  215. }
  216. if err := f.tables[freezerBodiesTable].Append(f.frozen-f.offset, body); err != nil {
  217. log.Error("Failed to append ancient body", "number", f.frozen, "hash", hash, "err", err)
  218. return err
  219. }
  220. if err := f.tables[freezerReceiptTable].Append(f.frozen-f.offset, receipts); err != nil {
  221. log.Error("Failed to append ancient receipts", "number", f.frozen, "hash", hash, "err", err)
  222. return err
  223. }
  224. if err := f.tables[freezerDifficultyTable].Append(f.frozen-f.offset, td); err != nil {
  225. log.Error("Failed to append ancient difficulty", "number", f.frozen, "hash", hash, "err", err)
  226. return err
  227. }
  228. atomic.AddUint64(&f.frozen, 1) // Only modify atomically
  229. return nil
  230. }
  231. // TruncateAncients discards any recent data above the provided threshold number.
  232. func (f *freezer) TruncateAncients(items uint64) error {
  233. if f.readonly {
  234. return errReadOnly
  235. }
  236. if atomic.LoadUint64(&f.frozen) <= items {
  237. return nil
  238. }
  239. for _, table := range f.tables {
  240. if err := table.truncate(items - f.offset); err != nil {
  241. return err
  242. }
  243. }
  244. atomic.StoreUint64(&f.frozen, items)
  245. return nil
  246. }
  247. // Sync flushes all data tables to disk.
  248. func (f *freezer) Sync() error {
  249. var errs []error
  250. for _, table := range f.tables {
  251. if err := table.Sync(); err != nil {
  252. errs = append(errs, err)
  253. }
  254. }
  255. if errs != nil {
  256. return fmt.Errorf("%v", errs)
  257. }
  258. return nil
  259. }
  260. // freeze is a background thread that periodically checks the blockchain for any
  261. // import progress and moves ancient data from the fast database into the freezer.
  262. //
  263. // This functionality is deliberately broken off from block importing to avoid
  264. // incurring additional data shuffling delays on block propagation.
  265. func (f *freezer) freeze(db ethdb.KeyValueStore) {
  266. nfdb := &nofreezedb{KeyValueStore: db}
  267. var (
  268. backoff bool
  269. triggered chan struct{} // Used in tests
  270. )
  271. for {
  272. select {
  273. case <-f.quit:
  274. log.Info("Freezer shutting down")
  275. return
  276. default:
  277. }
  278. if backoff {
  279. // If we were doing a manual trigger, notify it
  280. if triggered != nil {
  281. triggered <- struct{}{}
  282. triggered = nil
  283. }
  284. select {
  285. case <-time.NewTimer(freezerRecheckInterval).C:
  286. backoff = false
  287. case triggered = <-f.trigger:
  288. backoff = false
  289. case <-f.quit:
  290. return
  291. }
  292. }
  293. // Retrieve the freezing threshold.
  294. hash := ReadHeadBlockHash(nfdb)
  295. if hash == (common.Hash{}) {
  296. log.Debug("Current full block hash unavailable") // new chain, empty database
  297. backoff = true
  298. continue
  299. }
  300. number := ReadHeaderNumber(nfdb, hash)
  301. threshold := atomic.LoadUint64(&f.threshold)
  302. switch {
  303. case number == nil:
  304. log.Error("Current full block number unavailable", "hash", hash)
  305. backoff = true
  306. continue
  307. case *number < threshold:
  308. log.Debug("Current full block not old enough", "number", *number, "hash", hash, "delay", threshold)
  309. backoff = true
  310. continue
  311. case *number-threshold <= f.frozen:
  312. log.Debug("Ancient blocks frozen already", "number", *number, "hash", hash, "frozen", f.frozen)
  313. backoff = true
  314. continue
  315. }
  316. head := ReadHeader(nfdb, hash, *number)
  317. if head == nil {
  318. log.Error("Current full block unavailable", "number", *number, "hash", hash)
  319. backoff = true
  320. continue
  321. }
  322. // Seems we have data ready to be frozen, process in usable batches
  323. limit := *number - threshold
  324. if limit-f.frozen > freezerBatchLimit {
  325. limit = f.frozen + freezerBatchLimit
  326. }
  327. var (
  328. start = time.Now()
  329. first = f.frozen
  330. ancients = make([]common.Hash, 0, limit-f.frozen)
  331. )
  332. for f.frozen <= limit {
  333. // Retrieves all the components of the canonical block
  334. hash := ReadCanonicalHash(nfdb, f.frozen)
  335. if hash == (common.Hash{}) {
  336. log.Error("Canonical hash missing, can't freeze", "number", f.frozen)
  337. break
  338. }
  339. header := ReadHeaderRLP(nfdb, hash, f.frozen)
  340. if len(header) == 0 {
  341. log.Error("Block header missing, can't freeze", "number", f.frozen, "hash", hash)
  342. break
  343. }
  344. body := ReadBodyRLP(nfdb, hash, f.frozen)
  345. if len(body) == 0 {
  346. log.Error("Block body missing, can't freeze", "number", f.frozen, "hash", hash)
  347. break
  348. }
  349. receipts := ReadReceiptsRLP(nfdb, hash, f.frozen)
  350. if len(receipts) == 0 {
  351. log.Error("Block receipts missing, can't freeze", "number", f.frozen, "hash", hash)
  352. break
  353. }
  354. td := ReadTdRLP(nfdb, hash, f.frozen)
  355. if len(td) == 0 {
  356. log.Error("Total difficulty missing, can't freeze", "number", f.frozen, "hash", hash)
  357. break
  358. }
  359. log.Trace("Deep froze ancient block", "number", f.frozen, "hash", hash)
  360. // Inject all the components into the relevant data tables
  361. if err := f.AppendAncient(f.frozen, hash[:], header, body, receipts, td); err != nil {
  362. break
  363. }
  364. ancients = append(ancients, hash)
  365. }
  366. // Batch of blocks have been frozen, flush them before wiping from leveldb
  367. if err := f.Sync(); err != nil {
  368. log.Crit("Failed to flush frozen tables", "err", err)
  369. }
  370. // Wipe out all data from the active database
  371. batch := db.NewBatch()
  372. for i := 0; i < len(ancients); i++ {
  373. // Always keep the genesis block in active database
  374. if first+uint64(i) != 0 {
  375. DeleteBlockWithoutNumber(batch, ancients[i], first+uint64(i))
  376. DeleteCanonicalHash(batch, first+uint64(i))
  377. }
  378. }
  379. if err := batch.Write(); err != nil {
  380. log.Crit("Failed to delete frozen canonical blocks", "err", err)
  381. }
  382. batch.Reset()
  383. // Wipe out side chains also and track dangling side chians
  384. var dangling []common.Hash
  385. for number := first; number < f.frozen; number++ {
  386. // Always keep the genesis block in active database
  387. if number != 0 {
  388. dangling = ReadAllHashes(db, number)
  389. for _, hash := range dangling {
  390. log.Trace("Deleting side chain", "number", number, "hash", hash)
  391. DeleteBlock(batch, hash, number)
  392. }
  393. }
  394. }
  395. if err := batch.Write(); err != nil {
  396. log.Crit("Failed to delete frozen side blocks", "err", err)
  397. }
  398. batch.Reset()
  399. // Step into the future and delete and dangling side chains
  400. if f.frozen > 0 {
  401. tip := f.frozen
  402. for len(dangling) > 0 {
  403. drop := make(map[common.Hash]struct{})
  404. for _, hash := range dangling {
  405. log.Debug("Dangling parent from freezer", "number", tip-1, "hash", hash)
  406. drop[hash] = struct{}{}
  407. }
  408. children := ReadAllHashes(db, tip)
  409. for i := 0; i < len(children); i++ {
  410. // Dig up the child and ensure it's dangling
  411. child := ReadHeader(nfdb, children[i], tip)
  412. if child == nil {
  413. log.Error("Missing dangling header", "number", tip, "hash", children[i])
  414. continue
  415. }
  416. if _, ok := drop[child.ParentHash]; !ok {
  417. children = append(children[:i], children[i+1:]...)
  418. i--
  419. continue
  420. }
  421. // Delete all block data associated with the child
  422. log.Debug("Deleting dangling block", "number", tip, "hash", children[i], "parent", child.ParentHash)
  423. DeleteBlock(batch, children[i], tip)
  424. }
  425. dangling = children
  426. tip++
  427. }
  428. if err := batch.Write(); err != nil {
  429. log.Crit("Failed to delete dangling side blocks", "err", err)
  430. }
  431. }
  432. // Log something friendly for the user
  433. context := []interface{}{
  434. "blocks", f.frozen - first, "elapsed", common.PrettyDuration(time.Since(start)), "number", f.frozen - 1,
  435. }
  436. if n := len(ancients); n > 0 {
  437. context = append(context, []interface{}{"hash", ancients[n-1]}...)
  438. }
  439. log.Info("Deep froze chain segment", context...)
  440. // Avoid database thrashing with tiny writes
  441. if f.frozen-first < freezerBatchLimit {
  442. backoff = true
  443. }
  444. }
  445. }
  446. // repair truncates all data tables to the same length.
  447. func (f *freezer) repair() error {
  448. min := uint64(math.MaxUint64)
  449. for _, table := range f.tables {
  450. items := atomic.LoadUint64(&table.items)
  451. if min > items {
  452. min = items
  453. }
  454. }
  455. for _, table := range f.tables {
  456. if err := table.truncate(min); err != nil {
  457. return err
  458. }
  459. }
  460. atomic.StoreUint64(&f.frozen, min)
  461. return nil
  462. }