freezer.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472
  1. // Copyright 2019 The go-ethereum Authors
  2. // This file is part of the go-ethereum library.
  3. //
  4. // The go-ethereum library is free software: you can redistribute it and/or modify
  5. // it under the terms of the GNU Lesser General Public License as published by
  6. // the Free Software Foundation, either version 3 of the License, or
  7. // (at your option) any later version.
  8. //
  9. // The go-ethereum library is distributed in the hope that it will be useful,
  10. // but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. // GNU Lesser General Public License for more details.
  13. //
  14. // You should have received a copy of the GNU Lesser General Public License
  15. // along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
  16. package rawdb
  17. import (
  18. "errors"
  19. "fmt"
  20. "math"
  21. "os"
  22. "path/filepath"
  23. "sync"
  24. "sync/atomic"
  25. "time"
  26. "github.com/ethereum/go-ethereum/common"
  27. "github.com/ethereum/go-ethereum/ethdb"
  28. "github.com/ethereum/go-ethereum/log"
  29. "github.com/ethereum/go-ethereum/metrics"
  30. "github.com/ethereum/go-ethereum/params"
  31. "github.com/prometheus/tsdb/fileutil"
  32. )
  33. var (
  34. // errUnknownTable is returned if the user attempts to read from a table that is
  35. // not tracked by the freezer.
  36. errUnknownTable = errors.New("unknown table")
  37. // errOutOrderInsertion is returned if the user attempts to inject out-of-order
  38. // binary blobs into the freezer.
  39. errOutOrderInsertion = errors.New("the append operation is out-order")
  40. // errSymlinkDatadir is returned if the ancient directory specified by user
  41. // is a symbolic link.
  42. errSymlinkDatadir = errors.New("symbolic link datadir is not supported")
  43. )
  44. const (
  45. // freezerRecheckInterval is the frequency to check the key-value database for
  46. // chain progression that might permit new blocks to be frozen into immutable
  47. // storage.
  48. freezerRecheckInterval = time.Minute
  49. // freezerBatchLimit is the maximum number of blocks to freeze in one batch
  50. // before doing an fsync and deleting it from the key-value store.
  51. freezerBatchLimit = 30000
  52. )
  53. // freezer is an memory mapped append-only database to store immutable chain data
  54. // into flat files:
  55. //
  56. // - The append only nature ensures that disk writes are minimized.
  57. // - The memory mapping ensures we can max out system memory for caching without
  58. // reserving it for go-ethereum. This would also reduce the memory requirements
  59. // of Geth, and thus also GC overhead.
  60. type freezer struct {
  61. // WARNING: The `frozen` field is accessed atomically. On 32 bit platforms, only
  62. // 64-bit aligned fields can be atomic. The struct is guaranteed to be so aligned,
  63. // so take advantage of that (https://golang.org/pkg/sync/atomic/#pkg-note-BUG).
  64. frozen uint64 // Number of blocks already frozen
  65. threshold uint64 // Number of recent blocks not to freeze (params.FullImmutabilityThreshold apart from tests)
  66. tables map[string]*freezerTable // Data tables for storing everything
  67. instanceLock fileutil.Releaser // File-system lock to prevent double opens
  68. trigger chan chan struct{} // Manual blocking freeze trigger, test determinism
  69. quit chan struct{}
  70. closeOnce sync.Once
  71. }
  72. // newFreezer creates a chain freezer that moves ancient chain data into
  73. // append-only flat file containers.
  74. func newFreezer(datadir string, namespace string) (*freezer, error) {
  75. // Create the initial freezer object
  76. var (
  77. readMeter = metrics.NewRegisteredMeter(namespace+"ancient/read", nil)
  78. writeMeter = metrics.NewRegisteredMeter(namespace+"ancient/write", nil)
  79. sizeGauge = metrics.NewRegisteredGauge(namespace+"ancient/size", nil)
  80. )
  81. // Ensure the datadir is not a symbolic link if it exists.
  82. if info, err := os.Lstat(datadir); !os.IsNotExist(err) {
  83. if info.Mode()&os.ModeSymlink != 0 {
  84. log.Warn("Symbolic link ancient database is not supported", "path", datadir)
  85. return nil, errSymlinkDatadir
  86. }
  87. }
  88. // Leveldb uses LOCK as the filelock filename. To prevent the
  89. // name collision, we use FLOCK as the lock name.
  90. lock, _, err := fileutil.Flock(filepath.Join(datadir, "FLOCK"))
  91. if err != nil {
  92. return nil, err
  93. }
  94. // Open all the supported data tables
  95. freezer := &freezer{
  96. threshold: params.FullImmutabilityThreshold,
  97. tables: make(map[string]*freezerTable),
  98. instanceLock: lock,
  99. trigger: make(chan chan struct{}),
  100. quit: make(chan struct{}),
  101. }
  102. for name, disableSnappy := range freezerNoSnappy {
  103. table, err := newTable(datadir, name, readMeter, writeMeter, sizeGauge, disableSnappy)
  104. if err != nil {
  105. for _, table := range freezer.tables {
  106. table.Close()
  107. }
  108. lock.Release()
  109. return nil, err
  110. }
  111. freezer.tables[name] = table
  112. }
  113. if err := freezer.repair(); err != nil {
  114. for _, table := range freezer.tables {
  115. table.Close()
  116. }
  117. lock.Release()
  118. return nil, err
  119. }
  120. log.Info("Opened ancient database", "database", datadir)
  121. return freezer, nil
  122. }
  123. // Close terminates the chain freezer, unmapping all the data files.
  124. func (f *freezer) Close() error {
  125. var errs []error
  126. f.closeOnce.Do(func() {
  127. f.quit <- struct{}{}
  128. for _, table := range f.tables {
  129. if err := table.Close(); err != nil {
  130. errs = append(errs, err)
  131. }
  132. }
  133. if err := f.instanceLock.Release(); err != nil {
  134. errs = append(errs, err)
  135. }
  136. })
  137. if errs != nil {
  138. return fmt.Errorf("%v", errs)
  139. }
  140. return nil
  141. }
  142. // HasAncient returns an indicator whether the specified ancient data exists
  143. // in the freezer.
  144. func (f *freezer) HasAncient(kind string, number uint64) (bool, error) {
  145. if table := f.tables[kind]; table != nil {
  146. return table.has(number), nil
  147. }
  148. return false, nil
  149. }
  150. // Ancient retrieves an ancient binary blob from the append-only immutable files.
  151. func (f *freezer) Ancient(kind string, number uint64) ([]byte, error) {
  152. if table := f.tables[kind]; table != nil {
  153. return table.Retrieve(number)
  154. }
  155. return nil, errUnknownTable
  156. }
  157. // Ancients returns the length of the frozen items.
  158. func (f *freezer) Ancients() (uint64, error) {
  159. return atomic.LoadUint64(&f.frozen), nil
  160. }
  161. // AncientSize returns the ancient size of the specified category.
  162. func (f *freezer) AncientSize(kind string) (uint64, error) {
  163. if table := f.tables[kind]; table != nil {
  164. return table.size()
  165. }
  166. return 0, errUnknownTable
  167. }
  168. // AppendAncient injects all binary blobs belong to block at the end of the
  169. // append-only immutable table files.
  170. //
  171. // Notably, this function is lock free but kind of thread-safe. All out-of-order
  172. // injection will be rejected. But if two injections with same number happen at
  173. // the same time, we can get into the trouble.
  174. func (f *freezer) AppendAncient(number uint64, hash, header, body, receipts, td []byte) (err error) {
  175. // Ensure the binary blobs we are appending is continuous with freezer.
  176. if atomic.LoadUint64(&f.frozen) != number {
  177. return errOutOrderInsertion
  178. }
  179. // Rollback all inserted data if any insertion below failed to ensure
  180. // the tables won't out of sync.
  181. defer func() {
  182. if err != nil {
  183. rerr := f.repair()
  184. if rerr != nil {
  185. log.Crit("Failed to repair freezer", "err", rerr)
  186. }
  187. log.Info("Append ancient failed", "number", number, "err", err)
  188. }
  189. }()
  190. // Inject all the components into the relevant data tables
  191. if err := f.tables[freezerHashTable].Append(f.frozen, hash[:]); err != nil {
  192. log.Error("Failed to append ancient hash", "number", f.frozen, "hash", hash, "err", err)
  193. return err
  194. }
  195. if err := f.tables[freezerHeaderTable].Append(f.frozen, header); err != nil {
  196. log.Error("Failed to append ancient header", "number", f.frozen, "hash", hash, "err", err)
  197. return err
  198. }
  199. if err := f.tables[freezerBodiesTable].Append(f.frozen, body); err != nil {
  200. log.Error("Failed to append ancient body", "number", f.frozen, "hash", hash, "err", err)
  201. return err
  202. }
  203. if err := f.tables[freezerReceiptTable].Append(f.frozen, receipts); err != nil {
  204. log.Error("Failed to append ancient receipts", "number", f.frozen, "hash", hash, "err", err)
  205. return err
  206. }
  207. if err := f.tables[freezerDifficultyTable].Append(f.frozen, td); err != nil {
  208. log.Error("Failed to append ancient difficulty", "number", f.frozen, "hash", hash, "err", err)
  209. return err
  210. }
  211. atomic.AddUint64(&f.frozen, 1) // Only modify atomically
  212. return nil
  213. }
  214. // TruncateAncients discards any recent data above the provided threshold number.
  215. func (f *freezer) TruncateAncients(items uint64) error {
  216. if atomic.LoadUint64(&f.frozen) <= items {
  217. return nil
  218. }
  219. for _, table := range f.tables {
  220. if err := table.truncate(items); err != nil {
  221. return err
  222. }
  223. }
  224. atomic.StoreUint64(&f.frozen, items)
  225. return nil
  226. }
  227. // Sync flushes all data tables to disk.
  228. func (f *freezer) Sync() error {
  229. var errs []error
  230. for _, table := range f.tables {
  231. if err := table.Sync(); err != nil {
  232. errs = append(errs, err)
  233. }
  234. }
  235. if errs != nil {
  236. return fmt.Errorf("%v", errs)
  237. }
  238. return nil
  239. }
  240. // freeze is a background thread that periodically checks the blockchain for any
  241. // import progress and moves ancient data from the fast database into the freezer.
  242. //
  243. // This functionality is deliberately broken off from block importing to avoid
  244. // incurring additional data shuffling delays on block propagation.
  245. func (f *freezer) freeze(db ethdb.KeyValueStore) {
  246. nfdb := &nofreezedb{KeyValueStore: db}
  247. var (
  248. backoff bool
  249. triggered chan struct{} // Used in tests
  250. )
  251. for {
  252. select {
  253. case <-f.quit:
  254. log.Info("Freezer shutting down")
  255. return
  256. default:
  257. }
  258. if backoff {
  259. // If we were doing a manual trigger, notify it
  260. if triggered != nil {
  261. triggered <- struct{}{}
  262. triggered = nil
  263. }
  264. select {
  265. case <-time.NewTimer(freezerRecheckInterval).C:
  266. backoff = false
  267. case triggered = <-f.trigger:
  268. backoff = false
  269. case <-f.quit:
  270. return
  271. }
  272. }
  273. // Retrieve the freezing threshold.
  274. hash := ReadHeadBlockHash(nfdb)
  275. if hash == (common.Hash{}) {
  276. log.Debug("Current full block hash unavailable") // new chain, empty database
  277. backoff = true
  278. continue
  279. }
  280. number := ReadHeaderNumber(nfdb, hash)
  281. threshold := atomic.LoadUint64(&f.threshold)
  282. switch {
  283. case number == nil:
  284. log.Error("Current full block number unavailable", "hash", hash)
  285. backoff = true
  286. continue
  287. case *number < threshold:
  288. log.Debug("Current full block not old enough", "number", *number, "hash", hash, "delay", threshold)
  289. backoff = true
  290. continue
  291. case *number-threshold <= f.frozen:
  292. log.Debug("Ancient blocks frozen already", "number", *number, "hash", hash, "frozen", f.frozen)
  293. backoff = true
  294. continue
  295. }
  296. head := ReadHeader(nfdb, hash, *number)
  297. if head == nil {
  298. log.Error("Current full block unavailable", "number", *number, "hash", hash)
  299. backoff = true
  300. continue
  301. }
  302. // Seems we have data ready to be frozen, process in usable batches
  303. limit := *number - threshold
  304. if limit-f.frozen > freezerBatchLimit {
  305. limit = f.frozen + freezerBatchLimit
  306. }
  307. var (
  308. start = time.Now()
  309. first = f.frozen
  310. ancients = make([]common.Hash, 0, limit-f.frozen)
  311. )
  312. for f.frozen <= limit {
  313. // Retrieves all the components of the canonical block
  314. hash := ReadCanonicalHash(nfdb, f.frozen)
  315. if hash == (common.Hash{}) {
  316. log.Error("Canonical hash missing, can't freeze", "number", f.frozen)
  317. break
  318. }
  319. header := ReadHeaderRLP(nfdb, hash, f.frozen)
  320. if len(header) == 0 {
  321. log.Error("Block header missing, can't freeze", "number", f.frozen, "hash", hash)
  322. break
  323. }
  324. body := ReadBodyRLP(nfdb, hash, f.frozen)
  325. if len(body) == 0 {
  326. log.Error("Block body missing, can't freeze", "number", f.frozen, "hash", hash)
  327. break
  328. }
  329. receipts := ReadReceiptsRLP(nfdb, hash, f.frozen)
  330. if len(receipts) == 0 {
  331. log.Error("Block receipts missing, can't freeze", "number", f.frozen, "hash", hash)
  332. break
  333. }
  334. td := ReadTdRLP(nfdb, hash, f.frozen)
  335. if len(td) == 0 {
  336. log.Error("Total difficulty missing, can't freeze", "number", f.frozen, "hash", hash)
  337. break
  338. }
  339. log.Trace("Deep froze ancient block", "number", f.frozen, "hash", hash)
  340. // Inject all the components into the relevant data tables
  341. if err := f.AppendAncient(f.frozen, hash[:], header, body, receipts, td); err != nil {
  342. break
  343. }
  344. ancients = append(ancients, hash)
  345. }
  346. // Batch of blocks have been frozen, flush them before wiping from leveldb
  347. if err := f.Sync(); err != nil {
  348. log.Crit("Failed to flush frozen tables", "err", err)
  349. }
  350. // Wipe out all data from the active database
  351. batch := db.NewBatch()
  352. for i := 0; i < len(ancients); i++ {
  353. // Always keep the genesis block in active database
  354. if first+uint64(i) != 0 {
  355. DeleteBlockWithoutNumber(batch, ancients[i], first+uint64(i))
  356. DeleteCanonicalHash(batch, first+uint64(i))
  357. }
  358. }
  359. if err := batch.Write(); err != nil {
  360. log.Crit("Failed to delete frozen canonical blocks", "err", err)
  361. }
  362. batch.Reset()
  363. // Wipe out side chains also and track dangling side chians
  364. var dangling []common.Hash
  365. for number := first; number < f.frozen; number++ {
  366. // Always keep the genesis block in active database
  367. if number != 0 {
  368. dangling = ReadAllHashes(db, number)
  369. for _, hash := range dangling {
  370. log.Trace("Deleting side chain", "number", number, "hash", hash)
  371. DeleteBlock(batch, hash, number)
  372. }
  373. }
  374. }
  375. if err := batch.Write(); err != nil {
  376. log.Crit("Failed to delete frozen side blocks", "err", err)
  377. }
  378. batch.Reset()
  379. // Step into the future and delete and dangling side chains
  380. if f.frozen > 0 {
  381. tip := f.frozen
  382. for len(dangling) > 0 {
  383. drop := make(map[common.Hash]struct{})
  384. for _, hash := range dangling {
  385. log.Debug("Dangling parent from freezer", "number", tip-1, "hash", hash)
  386. drop[hash] = struct{}{}
  387. }
  388. children := ReadAllHashes(db, tip)
  389. for i := 0; i < len(children); i++ {
  390. // Dig up the child and ensure it's dangling
  391. child := ReadHeader(nfdb, children[i], tip)
  392. if child == nil {
  393. log.Error("Missing dangling header", "number", tip, "hash", children[i])
  394. continue
  395. }
  396. if _, ok := drop[child.ParentHash]; !ok {
  397. children = append(children[:i], children[i+1:]...)
  398. i--
  399. continue
  400. }
  401. // Delete all block data associated with the child
  402. log.Debug("Deleting dangling block", "number", tip, "hash", children[i], "parent", child.ParentHash)
  403. DeleteBlock(batch, children[i], tip)
  404. }
  405. dangling = children
  406. tip++
  407. }
  408. if err := batch.Write(); err != nil {
  409. log.Crit("Failed to delete dangling side blocks", "err", err)
  410. }
  411. }
  412. // Log something friendly for the user
  413. context := []interface{}{
  414. "blocks", f.frozen - first, "elapsed", common.PrettyDuration(time.Since(start)), "number", f.frozen - 1,
  415. }
  416. if n := len(ancients); n > 0 {
  417. context = append(context, []interface{}{"hash", ancients[n-1]}...)
  418. }
  419. log.Info("Deep froze chain segment", context...)
  420. // Avoid database thrashing with tiny writes
  421. if f.frozen-first < freezerBatchLimit {
  422. backoff = true
  423. }
  424. }
  425. }
  426. // repair truncates all data tables to the same length.
  427. func (f *freezer) repair() error {
  428. min := uint64(math.MaxUint64)
  429. for _, table := range f.tables {
  430. items := atomic.LoadUint64(&table.items)
  431. if min > items {
  432. min = items
  433. }
  434. }
  435. for _, table := range f.tables {
  436. if err := table.truncate(min); err != nil {
  437. return err
  438. }
  439. }
  440. atomic.StoreUint64(&f.frozen, min)
  441. return nil
  442. }