freezer.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484
  1. // Copyright 2019 The go-ethereum Authors
  2. // This file is part of the go-ethereum library.
  3. //
  4. // The go-ethereum library is free software: you can redistribute it and/or modify
  5. // it under the terms of the GNU Lesser General Public License as published by
  6. // the Free Software Foundation, either version 3 of the License, or
  7. // (at your option) any later version.
  8. //
  9. // The go-ethereum library is distributed in the hope that it will be useful,
  10. // but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. // GNU Lesser General Public License for more details.
  13. //
  14. // You should have received a copy of the GNU Lesser General Public License
  15. // along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
  16. package rawdb
  17. import (
  18. "errors"
  19. "fmt"
  20. "math"
  21. "os"
  22. "path/filepath"
  23. "sync"
  24. "sync/atomic"
  25. "time"
  26. "github.com/ethereum/go-ethereum/common"
  27. "github.com/ethereum/go-ethereum/ethdb"
  28. "github.com/ethereum/go-ethereum/log"
  29. "github.com/ethereum/go-ethereum/metrics"
  30. "github.com/ethereum/go-ethereum/params"
  31. "github.com/prometheus/tsdb/fileutil"
  32. )
  33. var (
  34. // errReadOnly is returned if the freezer is opened in read only mode. All the
  35. // mutations are disallowed.
  36. errReadOnly = errors.New("read only")
  37. // errUnknownTable is returned if the user attempts to read from a table that is
  38. // not tracked by the freezer.
  39. errUnknownTable = errors.New("unknown table")
  40. // errOutOrderInsertion is returned if the user attempts to inject out-of-order
  41. // binary blobs into the freezer.
  42. errOutOrderInsertion = errors.New("the append operation is out-order")
  43. // errSymlinkDatadir is returned if the ancient directory specified by user
  44. // is a symbolic link.
  45. errSymlinkDatadir = errors.New("symbolic link datadir is not supported")
  46. )
  47. const (
  48. // freezerRecheckInterval is the frequency to check the key-value database for
  49. // chain progression that might permit new blocks to be frozen into immutable
  50. // storage.
  51. freezerRecheckInterval = time.Minute
  52. // freezerBatchLimit is the maximum number of blocks to freeze in one batch
  53. // before doing an fsync and deleting it from the key-value store.
  54. freezerBatchLimit = 30000
  55. )
  56. // freezer is an memory mapped append-only database to store immutable chain data
  57. // into flat files:
  58. //
  59. // - The append only nature ensures that disk writes are minimized.
  60. // - The memory mapping ensures we can max out system memory for caching without
  61. // reserving it for go-ethereum. This would also reduce the memory requirements
  62. // of Geth, and thus also GC overhead.
  63. type freezer struct {
  64. // WARNING: The `frozen` field is accessed atomically. On 32 bit platforms, only
  65. // 64-bit aligned fields can be atomic. The struct is guaranteed to be so aligned,
  66. // so take advantage of that (https://golang.org/pkg/sync/atomic/#pkg-note-BUG).
  67. frozen uint64 // Number of blocks already frozen
  68. threshold uint64 // Number of recent blocks not to freeze (params.FullImmutabilityThreshold apart from tests)
  69. readonly bool
  70. tables map[string]*freezerTable // Data tables for storing everything
  71. instanceLock fileutil.Releaser // File-system lock to prevent double opens
  72. trigger chan chan struct{} // Manual blocking freeze trigger, test determinism
  73. quit chan struct{}
  74. closeOnce sync.Once
  75. }
  76. // newFreezer creates a chain freezer that moves ancient chain data into
  77. // append-only flat file containers.
  78. func newFreezer(datadir string, namespace string, readonly bool) (*freezer, error) {
  79. // Create the initial freezer object
  80. var (
  81. readMeter = metrics.NewRegisteredMeter(namespace+"ancient/read", nil)
  82. writeMeter = metrics.NewRegisteredMeter(namespace+"ancient/write", nil)
  83. sizeGauge = metrics.NewRegisteredGauge(namespace+"ancient/size", nil)
  84. )
  85. // Ensure the datadir is not a symbolic link if it exists.
  86. if info, err := os.Lstat(datadir); !os.IsNotExist(err) {
  87. if info.Mode()&os.ModeSymlink != 0 {
  88. log.Warn("Symbolic link ancient database is not supported", "path", datadir)
  89. return nil, errSymlinkDatadir
  90. }
  91. }
  92. // Leveldb uses LOCK as the filelock filename. To prevent the
  93. // name collision, we use FLOCK as the lock name.
  94. lock, _, err := fileutil.Flock(filepath.Join(datadir, "FLOCK"))
  95. if err != nil {
  96. return nil, err
  97. }
  98. // Open all the supported data tables
  99. freezer := &freezer{
  100. readonly: readonly,
  101. threshold: params.FullImmutabilityThreshold,
  102. tables: make(map[string]*freezerTable),
  103. instanceLock: lock,
  104. trigger: make(chan chan struct{}),
  105. quit: make(chan struct{}),
  106. }
  107. for name, disableSnappy := range FreezerNoSnappy {
  108. table, err := newTable(datadir, name, readMeter, writeMeter, sizeGauge, disableSnappy)
  109. if err != nil {
  110. for _, table := range freezer.tables {
  111. table.Close()
  112. }
  113. lock.Release()
  114. return nil, err
  115. }
  116. freezer.tables[name] = table
  117. }
  118. if err := freezer.repair(); err != nil {
  119. for _, table := range freezer.tables {
  120. table.Close()
  121. }
  122. lock.Release()
  123. return nil, err
  124. }
  125. log.Info("Opened ancient database", "database", datadir, "readonly", readonly)
  126. return freezer, nil
  127. }
  128. // Close terminates the chain freezer, unmapping all the data files.
  129. func (f *freezer) Close() error {
  130. var errs []error
  131. f.closeOnce.Do(func() {
  132. close(f.quit)
  133. for _, table := range f.tables {
  134. if err := table.Close(); err != nil {
  135. errs = append(errs, err)
  136. }
  137. }
  138. if err := f.instanceLock.Release(); err != nil {
  139. errs = append(errs, err)
  140. }
  141. })
  142. if errs != nil {
  143. return fmt.Errorf("%v", errs)
  144. }
  145. return nil
  146. }
  147. // HasAncient returns an indicator whether the specified ancient data exists
  148. // in the freezer.
  149. func (f *freezer) HasAncient(kind string, number uint64) (bool, error) {
  150. if table := f.tables[kind]; table != nil {
  151. return table.has(number), nil
  152. }
  153. return false, nil
  154. }
  155. // Ancient retrieves an ancient binary blob from the append-only immutable files.
  156. func (f *freezer) Ancient(kind string, number uint64) ([]byte, error) {
  157. if table := f.tables[kind]; table != nil {
  158. return table.Retrieve(number)
  159. }
  160. return nil, errUnknownTable
  161. }
  162. // Ancients returns the length of the frozen items.
  163. func (f *freezer) Ancients() (uint64, error) {
  164. return atomic.LoadUint64(&f.frozen), nil
  165. }
  166. // AncientSize returns the ancient size of the specified category.
  167. func (f *freezer) AncientSize(kind string) (uint64, error) {
  168. if table := f.tables[kind]; table != nil {
  169. return table.size()
  170. }
  171. return 0, errUnknownTable
  172. }
  173. // AppendAncient injects all binary blobs belong to block at the end of the
  174. // append-only immutable table files.
  175. //
  176. // Notably, this function is lock free but kind of thread-safe. All out-of-order
  177. // injection will be rejected. But if two injections with same number happen at
  178. // the same time, we can get into the trouble.
  179. func (f *freezer) AppendAncient(number uint64, hash, header, body, receipts, td []byte) (err error) {
  180. if f.readonly {
  181. return errReadOnly
  182. }
  183. // Ensure the binary blobs we are appending is continuous with freezer.
  184. if atomic.LoadUint64(&f.frozen) != number {
  185. return errOutOrderInsertion
  186. }
  187. // Rollback all inserted data if any insertion below failed to ensure
  188. // the tables won't out of sync.
  189. defer func() {
  190. if err != nil {
  191. rerr := f.repair()
  192. if rerr != nil {
  193. log.Crit("Failed to repair freezer", "err", rerr)
  194. }
  195. log.Info("Append ancient failed", "number", number, "err", err)
  196. }
  197. }()
  198. // Inject all the components into the relevant data tables
  199. if err := f.tables[freezerHashTable].Append(f.frozen, hash[:]); err != nil {
  200. log.Error("Failed to append ancient hash", "number", f.frozen, "hash", hash, "err", err)
  201. return err
  202. }
  203. if err := f.tables[freezerHeaderTable].Append(f.frozen, header); err != nil {
  204. log.Error("Failed to append ancient header", "number", f.frozen, "hash", hash, "err", err)
  205. return err
  206. }
  207. if err := f.tables[freezerBodiesTable].Append(f.frozen, body); err != nil {
  208. log.Error("Failed to append ancient body", "number", f.frozen, "hash", hash, "err", err)
  209. return err
  210. }
  211. if err := f.tables[freezerReceiptTable].Append(f.frozen, receipts); err != nil {
  212. log.Error("Failed to append ancient receipts", "number", f.frozen, "hash", hash, "err", err)
  213. return err
  214. }
  215. if err := f.tables[freezerDifficultyTable].Append(f.frozen, td); err != nil {
  216. log.Error("Failed to append ancient difficulty", "number", f.frozen, "hash", hash, "err", err)
  217. return err
  218. }
  219. atomic.AddUint64(&f.frozen, 1) // Only modify atomically
  220. return nil
  221. }
  222. // TruncateAncients discards any recent data above the provided threshold number.
  223. func (f *freezer) TruncateAncients(items uint64) error {
  224. if f.readonly {
  225. return errReadOnly
  226. }
  227. if atomic.LoadUint64(&f.frozen) <= items {
  228. return nil
  229. }
  230. for _, table := range f.tables {
  231. if err := table.truncate(items); err != nil {
  232. return err
  233. }
  234. }
  235. atomic.StoreUint64(&f.frozen, items)
  236. return nil
  237. }
  238. // Sync flushes all data tables to disk.
  239. func (f *freezer) Sync() error {
  240. var errs []error
  241. for _, table := range f.tables {
  242. if err := table.Sync(); err != nil {
  243. errs = append(errs, err)
  244. }
  245. }
  246. if errs != nil {
  247. return fmt.Errorf("%v", errs)
  248. }
  249. return nil
  250. }
  251. // freeze is a background thread that periodically checks the blockchain for any
  252. // import progress and moves ancient data from the fast database into the freezer.
  253. //
  254. // This functionality is deliberately broken off from block importing to avoid
  255. // incurring additional data shuffling delays on block propagation.
  256. func (f *freezer) freeze(db ethdb.KeyValueStore) {
  257. nfdb := &nofreezedb{KeyValueStore: db}
  258. var (
  259. backoff bool
  260. triggered chan struct{} // Used in tests
  261. )
  262. for {
  263. select {
  264. case <-f.quit:
  265. log.Info("Freezer shutting down")
  266. return
  267. default:
  268. }
  269. if backoff {
  270. // If we were doing a manual trigger, notify it
  271. if triggered != nil {
  272. triggered <- struct{}{}
  273. triggered = nil
  274. }
  275. select {
  276. case <-time.NewTimer(freezerRecheckInterval).C:
  277. backoff = false
  278. case triggered = <-f.trigger:
  279. backoff = false
  280. case <-f.quit:
  281. return
  282. }
  283. }
  284. // Retrieve the freezing threshold.
  285. hash := ReadHeadBlockHash(nfdb)
  286. if hash == (common.Hash{}) {
  287. log.Debug("Current full block hash unavailable") // new chain, empty database
  288. backoff = true
  289. continue
  290. }
  291. number := ReadHeaderNumber(nfdb, hash)
  292. threshold := atomic.LoadUint64(&f.threshold)
  293. switch {
  294. case number == nil:
  295. log.Error("Current full block number unavailable", "hash", hash)
  296. backoff = true
  297. continue
  298. case *number < threshold:
  299. log.Debug("Current full block not old enough", "number", *number, "hash", hash, "delay", threshold)
  300. backoff = true
  301. continue
  302. case *number-threshold <= f.frozen:
  303. log.Debug("Ancient blocks frozen already", "number", *number, "hash", hash, "frozen", f.frozen)
  304. backoff = true
  305. continue
  306. }
  307. head := ReadHeader(nfdb, hash, *number)
  308. if head == nil {
  309. log.Error("Current full block unavailable", "number", *number, "hash", hash)
  310. backoff = true
  311. continue
  312. }
  313. // Seems we have data ready to be frozen, process in usable batches
  314. limit := *number - threshold
  315. if limit-f.frozen > freezerBatchLimit {
  316. limit = f.frozen + freezerBatchLimit
  317. }
  318. var (
  319. start = time.Now()
  320. first = f.frozen
  321. ancients = make([]common.Hash, 0, limit-f.frozen)
  322. )
  323. for f.frozen <= limit {
  324. // Retrieves all the components of the canonical block
  325. hash := ReadCanonicalHash(nfdb, f.frozen)
  326. if hash == (common.Hash{}) {
  327. log.Error("Canonical hash missing, can't freeze", "number", f.frozen)
  328. break
  329. }
  330. header := ReadHeaderRLP(nfdb, hash, f.frozen)
  331. if len(header) == 0 {
  332. log.Error("Block header missing, can't freeze", "number", f.frozen, "hash", hash)
  333. break
  334. }
  335. body := ReadBodyRLP(nfdb, hash, f.frozen)
  336. if len(body) == 0 {
  337. log.Error("Block body missing, can't freeze", "number", f.frozen, "hash", hash)
  338. break
  339. }
  340. receipts := ReadReceiptsRLP(nfdb, hash, f.frozen)
  341. if len(receipts) == 0 {
  342. log.Error("Block receipts missing, can't freeze", "number", f.frozen, "hash", hash)
  343. break
  344. }
  345. td := ReadTdRLP(nfdb, hash, f.frozen)
  346. if len(td) == 0 {
  347. log.Error("Total difficulty missing, can't freeze", "number", f.frozen, "hash", hash)
  348. break
  349. }
  350. log.Trace("Deep froze ancient block", "number", f.frozen, "hash", hash)
  351. // Inject all the components into the relevant data tables
  352. if err := f.AppendAncient(f.frozen, hash[:], header, body, receipts, td); err != nil {
  353. break
  354. }
  355. ancients = append(ancients, hash)
  356. }
  357. // Batch of blocks have been frozen, flush them before wiping from leveldb
  358. if err := f.Sync(); err != nil {
  359. log.Crit("Failed to flush frozen tables", "err", err)
  360. }
  361. // Wipe out all data from the active database
  362. batch := db.NewBatch()
  363. for i := 0; i < len(ancients); i++ {
  364. // Always keep the genesis block in active database
  365. if first+uint64(i) != 0 {
  366. DeleteBlockWithoutNumber(batch, ancients[i], first+uint64(i))
  367. DeleteCanonicalHash(batch, first+uint64(i))
  368. }
  369. }
  370. if err := batch.Write(); err != nil {
  371. log.Crit("Failed to delete frozen canonical blocks", "err", err)
  372. }
  373. batch.Reset()
  374. // Wipe out side chains also and track dangling side chians
  375. var dangling []common.Hash
  376. for number := first; number < f.frozen; number++ {
  377. // Always keep the genesis block in active database
  378. if number != 0 {
  379. dangling = ReadAllHashes(db, number)
  380. for _, hash := range dangling {
  381. log.Trace("Deleting side chain", "number", number, "hash", hash)
  382. DeleteBlock(batch, hash, number)
  383. }
  384. }
  385. }
  386. if err := batch.Write(); err != nil {
  387. log.Crit("Failed to delete frozen side blocks", "err", err)
  388. }
  389. batch.Reset()
  390. // Step into the future and delete and dangling side chains
  391. if f.frozen > 0 {
  392. tip := f.frozen
  393. for len(dangling) > 0 {
  394. drop := make(map[common.Hash]struct{})
  395. for _, hash := range dangling {
  396. log.Debug("Dangling parent from freezer", "number", tip-1, "hash", hash)
  397. drop[hash] = struct{}{}
  398. }
  399. children := ReadAllHashes(db, tip)
  400. for i := 0; i < len(children); i++ {
  401. // Dig up the child and ensure it's dangling
  402. child := ReadHeader(nfdb, children[i], tip)
  403. if child == nil {
  404. log.Error("Missing dangling header", "number", tip, "hash", children[i])
  405. continue
  406. }
  407. if _, ok := drop[child.ParentHash]; !ok {
  408. children = append(children[:i], children[i+1:]...)
  409. i--
  410. continue
  411. }
  412. // Delete all block data associated with the child
  413. log.Debug("Deleting dangling block", "number", tip, "hash", children[i], "parent", child.ParentHash)
  414. DeleteBlock(batch, children[i], tip)
  415. }
  416. dangling = children
  417. tip++
  418. }
  419. if err := batch.Write(); err != nil {
  420. log.Crit("Failed to delete dangling side blocks", "err", err)
  421. }
  422. }
  423. // Log something friendly for the user
  424. context := []interface{}{
  425. "blocks", f.frozen - first, "elapsed", common.PrettyDuration(time.Since(start)), "number", f.frozen - 1,
  426. }
  427. if n := len(ancients); n > 0 {
  428. context = append(context, []interface{}{"hash", ancients[n-1]}...)
  429. }
  430. log.Info("Deep froze chain segment", context...)
  431. // Avoid database thrashing with tiny writes
  432. if f.frozen-first < freezerBatchLimit {
  433. backoff = true
  434. }
  435. }
  436. }
  437. // repair truncates all data tables to the same length.
  438. func (f *freezer) repair() error {
  439. min := uint64(math.MaxUint64)
  440. for _, table := range f.tables {
  441. items := atomic.LoadUint64(&table.items)
  442. if min > items {
  443. min = items
  444. }
  445. }
  446. for _, table := range f.tables {
  447. if err := table.truncate(min); err != nil {
  448. return err
  449. }
  450. }
  451. atomic.StoreUint64(&f.frozen, min)
  452. return nil
  453. }