database.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466
  1. // Copyright 2014 The go-ethereum Authors
  2. // This file is part of the go-ethereum library.
  3. //
  4. // The go-ethereum library is free software: you can redistribute it and/or modify
  5. // it under the terms of the GNU Lesser General Public License as published by
  6. // the Free Software Foundation, either version 3 of the License, or
  7. // (at your option) any later version.
  8. //
  9. // The go-ethereum library is distributed in the hope that it will be useful,
  10. // but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. // GNU Lesser General Public License for more details.
  13. //
  14. // You should have received a copy of the GNU Lesser General Public License
  15. // along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
  16. package ethdb
  17. import (
  18. "fmt"
  19. "strconv"
  20. "strings"
  21. "sync"
  22. "time"
  23. "github.com/ethereum/go-ethereum/log"
  24. "github.com/ethereum/go-ethereum/metrics"
  25. "github.com/syndtr/goleveldb/leveldb"
  26. "github.com/syndtr/goleveldb/leveldb/errors"
  27. "github.com/syndtr/goleveldb/leveldb/filter"
  28. "github.com/syndtr/goleveldb/leveldb/iterator"
  29. "github.com/syndtr/goleveldb/leveldb/opt"
  30. "github.com/syndtr/goleveldb/leveldb/util"
  31. )
  32. const (
  33. writeDelayNThreshold = 200
  34. writeDelayThreshold = 350 * time.Millisecond
  35. writeDelayWarningThrottler = 1 * time.Minute
  36. )
  37. var OpenFileLimit = 64
  38. type LDBDatabase struct {
  39. fn string // filename for reporting
  40. db *leveldb.DB // LevelDB instance
  41. compTimeMeter metrics.Meter // Meter for measuring the total time spent in database compaction
  42. compReadMeter metrics.Meter // Meter for measuring the data read during compaction
  43. compWriteMeter metrics.Meter // Meter for measuring the data written during compaction
  44. writeDelayNMeter metrics.Meter // Meter for measuring the write delay number due to database compaction
  45. writeDelayMeter metrics.Meter // Meter for measuring the write delay duration due to database compaction
  46. diskReadMeter metrics.Meter // Meter for measuring the effective amount of data read
  47. diskWriteMeter metrics.Meter // Meter for measuring the effective amount of data written
  48. quitLock sync.Mutex // Mutex protecting the quit channel access
  49. quitChan chan chan error // Quit channel to stop the metrics collection before closing the database
  50. log log.Logger // Contextual logger tracking the database path
  51. }
  52. // NewLDBDatabase returns a LevelDB wrapped object.
  53. func NewLDBDatabase(file string, cache int, handles int) (*LDBDatabase, error) {
  54. logger := log.New("database", file)
  55. // Ensure we have some minimal caching and file guarantees
  56. if cache < 16 {
  57. cache = 16
  58. }
  59. if handles < 16 {
  60. handles = 16
  61. }
  62. logger.Info("Allocated cache and file handles", "cache", cache, "handles", handles)
  63. // Open the db and recover any potential corruptions
  64. db, err := leveldb.OpenFile(file, &opt.Options{
  65. OpenFilesCacheCapacity: handles,
  66. BlockCacheCapacity: cache / 2 * opt.MiB,
  67. WriteBuffer: cache / 4 * opt.MiB, // Two of these are used internally
  68. Filter: filter.NewBloomFilter(10),
  69. })
  70. if _, corrupted := err.(*errors.ErrCorrupted); corrupted {
  71. db, err = leveldb.RecoverFile(file, nil)
  72. }
  73. // (Re)check for errors and abort if opening of the db failed
  74. if err != nil {
  75. return nil, err
  76. }
  77. return &LDBDatabase{
  78. fn: file,
  79. db: db,
  80. log: logger,
  81. }, nil
  82. }
  83. // Path returns the path to the database directory.
  84. func (db *LDBDatabase) Path() string {
  85. return db.fn
  86. }
  87. // Put puts the given key / value to the queue
  88. func (db *LDBDatabase) Put(key []byte, value []byte) error {
  89. return db.db.Put(key, value, nil)
  90. }
  91. func (db *LDBDatabase) Has(key []byte) (bool, error) {
  92. return db.db.Has(key, nil)
  93. }
  94. // Get returns the given key if it's present.
  95. func (db *LDBDatabase) Get(key []byte) ([]byte, error) {
  96. dat, err := db.db.Get(key, nil)
  97. if err != nil {
  98. return nil, err
  99. }
  100. return dat, nil
  101. }
  102. // Delete deletes the key from the queue and database
  103. func (db *LDBDatabase) Delete(key []byte) error {
  104. return db.db.Delete(key, nil)
  105. }
  106. func (db *LDBDatabase) NewIterator() iterator.Iterator {
  107. return db.db.NewIterator(nil, nil)
  108. }
  109. // NewIteratorWithPrefix returns a iterator to iterate over subset of database content with a particular prefix.
  110. func (db *LDBDatabase) NewIteratorWithPrefix(prefix []byte) iterator.Iterator {
  111. return db.db.NewIterator(util.BytesPrefix(prefix), nil)
  112. }
  113. func (db *LDBDatabase) Close() {
  114. // Stop the metrics collection to avoid internal database races
  115. db.quitLock.Lock()
  116. defer db.quitLock.Unlock()
  117. if db.quitChan != nil {
  118. errc := make(chan error)
  119. db.quitChan <- errc
  120. if err := <-errc; err != nil {
  121. db.log.Error("Metrics collection failed", "err", err)
  122. }
  123. db.quitChan = nil
  124. }
  125. err := db.db.Close()
  126. if err == nil {
  127. db.log.Info("Database closed")
  128. } else {
  129. db.log.Error("Failed to close database", "err", err)
  130. }
  131. }
  132. func (db *LDBDatabase) LDB() *leveldb.DB {
  133. return db.db
  134. }
  135. // Meter configures the database metrics collectors and
  136. func (db *LDBDatabase) Meter(prefix string) {
  137. if metrics.Enabled {
  138. // Initialize all the metrics collector at the requested prefix
  139. db.compTimeMeter = metrics.NewRegisteredMeter(prefix+"compact/time", nil)
  140. db.compReadMeter = metrics.NewRegisteredMeter(prefix+"compact/input", nil)
  141. db.compWriteMeter = metrics.NewRegisteredMeter(prefix+"compact/output", nil)
  142. db.diskReadMeter = metrics.NewRegisteredMeter(prefix+"disk/read", nil)
  143. db.diskWriteMeter = metrics.NewRegisteredMeter(prefix+"disk/write", nil)
  144. }
  145. // Initialize write delay metrics no matter we are in metric mode or not.
  146. db.writeDelayMeter = metrics.NewRegisteredMeter(prefix+"compact/writedelay/duration", nil)
  147. db.writeDelayNMeter = metrics.NewRegisteredMeter(prefix+"compact/writedelay/counter", nil)
  148. // Create a quit channel for the periodic collector and run it
  149. db.quitLock.Lock()
  150. db.quitChan = make(chan chan error)
  151. db.quitLock.Unlock()
  152. go db.meter(3 * time.Second)
  153. }
  154. // meter periodically retrieves internal leveldb counters and reports them to
  155. // the metrics subsystem.
  156. //
  157. // This is how a stats table look like (currently):
  158. // Compactions
  159. // Level | Tables | Size(MB) | Time(sec) | Read(MB) | Write(MB)
  160. // -------+------------+---------------+---------------+---------------+---------------
  161. // 0 | 0 | 0.00000 | 1.27969 | 0.00000 | 12.31098
  162. // 1 | 85 | 109.27913 | 28.09293 | 213.92493 | 214.26294
  163. // 2 | 523 | 1000.37159 | 7.26059 | 66.86342 | 66.77884
  164. // 3 | 570 | 1113.18458 | 0.00000 | 0.00000 | 0.00000
  165. //
  166. // This is how the write delay look like (currently):
  167. // DelayN:5 Delay:406.604657ms Paused: false
  168. //
  169. // This is how the iostats look like (currently):
  170. // Read(MB):3895.04860 Write(MB):3654.64712
  171. func (db *LDBDatabase) meter(refresh time.Duration) {
  172. // Create the counters to store current and previous compaction values
  173. compactions := make([][]float64, 2)
  174. for i := 0; i < 2; i++ {
  175. compactions[i] = make([]float64, 3)
  176. }
  177. // Create storage for iostats.
  178. var iostats [2]float64
  179. // Create storage and warning log tracer for write delay.
  180. var (
  181. delaystats [2]int64
  182. lastWriteDelay time.Time
  183. lastWriteDelayN time.Time
  184. lastWritePaused time.Time
  185. )
  186. var (
  187. errc chan error
  188. merr error
  189. )
  190. // Iterate ad infinitum and collect the stats
  191. for i := 1; errc == nil && merr == nil; i++ {
  192. // Retrieve the database stats
  193. stats, err := db.db.GetProperty("leveldb.stats")
  194. if err != nil {
  195. db.log.Error("Failed to read database stats", "err", err)
  196. merr = err
  197. continue
  198. }
  199. // Find the compaction table, skip the header
  200. lines := strings.Split(stats, "\n")
  201. for len(lines) > 0 && strings.TrimSpace(lines[0]) != "Compactions" {
  202. lines = lines[1:]
  203. }
  204. if len(lines) <= 3 {
  205. db.log.Error("Compaction table not found")
  206. merr = errors.New("compaction table not found")
  207. continue
  208. }
  209. lines = lines[3:]
  210. // Iterate over all the table rows, and accumulate the entries
  211. for j := 0; j < len(compactions[i%2]); j++ {
  212. compactions[i%2][j] = 0
  213. }
  214. for _, line := range lines {
  215. parts := strings.Split(line, "|")
  216. if len(parts) != 6 {
  217. break
  218. }
  219. for idx, counter := range parts[3:] {
  220. value, err := strconv.ParseFloat(strings.TrimSpace(counter), 64)
  221. if err != nil {
  222. db.log.Error("Compaction entry parsing failed", "err", err)
  223. merr = err
  224. continue
  225. }
  226. compactions[i%2][idx] += value
  227. }
  228. }
  229. // Update all the requested meters
  230. if db.compTimeMeter != nil {
  231. db.compTimeMeter.Mark(int64((compactions[i%2][0] - compactions[(i-1)%2][0]) * 1000 * 1000 * 1000))
  232. }
  233. if db.compReadMeter != nil {
  234. db.compReadMeter.Mark(int64((compactions[i%2][1] - compactions[(i-1)%2][1]) * 1024 * 1024))
  235. }
  236. if db.compWriteMeter != nil {
  237. db.compWriteMeter.Mark(int64((compactions[i%2][2] - compactions[(i-1)%2][2]) * 1024 * 1024))
  238. }
  239. // Retrieve the write delay statistic
  240. writedelay, err := db.db.GetProperty("leveldb.writedelay")
  241. if err != nil {
  242. db.log.Error("Failed to read database write delay statistic", "err", err)
  243. merr = err
  244. continue
  245. }
  246. var (
  247. delayN int64
  248. delayDuration string
  249. duration time.Duration
  250. paused bool
  251. )
  252. if n, err := fmt.Sscanf(writedelay, "DelayN:%d Delay:%s Paused:%t", &delayN, &delayDuration, &paused); n != 3 || err != nil {
  253. db.log.Error("Write delay statistic not found")
  254. merr = err
  255. continue
  256. }
  257. duration, err = time.ParseDuration(delayDuration)
  258. if err != nil {
  259. db.log.Error("Failed to parse delay duration", "err", err)
  260. merr = err
  261. continue
  262. }
  263. if db.writeDelayNMeter != nil {
  264. db.writeDelayNMeter.Mark(delayN - delaystats[0])
  265. // If the write delay number been collected in the last minute exceeds the predefined threshold,
  266. // print a warning log here.
  267. // If a warning that db performance is laggy has been displayed,
  268. // any subsequent warnings will be withhold for 1 minute to don't overwhelm the user.
  269. if int(db.writeDelayNMeter.Rate1()) > writeDelayNThreshold &&
  270. time.Now().After(lastWriteDelayN.Add(writeDelayWarningThrottler)) {
  271. db.log.Warn("Write delay number exceeds the threshold (200 per second) in the last minute")
  272. lastWriteDelayN = time.Now()
  273. }
  274. }
  275. if db.writeDelayMeter != nil {
  276. db.writeDelayMeter.Mark(duration.Nanoseconds() - delaystats[1])
  277. // If the write delay duration been collected in the last minute exceeds the predefined threshold,
  278. // print a warning log here.
  279. // If a warning that db performance is laggy has been displayed,
  280. // any subsequent warnings will be withhold for 1 minute to don't overwhelm the user.
  281. if int64(db.writeDelayMeter.Rate1()) > writeDelayThreshold.Nanoseconds() &&
  282. time.Now().After(lastWriteDelay.Add(writeDelayWarningThrottler)) {
  283. db.log.Warn("Write delay duration exceeds the threshold (35% of the time) in the last minute")
  284. lastWriteDelay = time.Now()
  285. }
  286. }
  287. // If a warning that db is performing compaction has been displayed, any subsequent
  288. // warnings will be withheld for one minute not to overwhelm the user.
  289. if paused && delayN-delaystats[0] == 0 && duration.Nanoseconds()-delaystats[1] == 0 &&
  290. time.Now().After(lastWritePaused.Add(writeDelayWarningThrottler)) {
  291. db.log.Warn("Database compacting, degraded performance")
  292. lastWritePaused = time.Now()
  293. }
  294. delaystats[0], delaystats[1] = delayN, duration.Nanoseconds()
  295. // Retrieve the database iostats.
  296. ioStats, err := db.db.GetProperty("leveldb.iostats")
  297. if err != nil {
  298. db.log.Error("Failed to read database iostats", "err", err)
  299. merr = err
  300. continue
  301. }
  302. var nRead, nWrite float64
  303. parts := strings.Split(ioStats, " ")
  304. if len(parts) < 2 {
  305. db.log.Error("Bad syntax of ioStats", "ioStats", ioStats)
  306. merr = fmt.Errorf("bad syntax of ioStats %s", ioStats)
  307. continue
  308. }
  309. if n, err := fmt.Sscanf(parts[0], "Read(MB):%f", &nRead); n != 1 || err != nil {
  310. db.log.Error("Bad syntax of read entry", "entry", parts[0])
  311. merr = err
  312. continue
  313. }
  314. if n, err := fmt.Sscanf(parts[1], "Write(MB):%f", &nWrite); n != 1 || err != nil {
  315. db.log.Error("Bad syntax of write entry", "entry", parts[1])
  316. merr = err
  317. continue
  318. }
  319. if db.diskReadMeter != nil {
  320. db.diskReadMeter.Mark(int64((nRead - iostats[0]) * 1024 * 1024))
  321. }
  322. if db.diskWriteMeter != nil {
  323. db.diskWriteMeter.Mark(int64((nWrite - iostats[1]) * 1024 * 1024))
  324. }
  325. iostats[0], iostats[1] = nRead, nWrite
  326. // Sleep a bit, then repeat the stats collection
  327. select {
  328. case errc = <-db.quitChan:
  329. // Quit requesting, stop hammering the database
  330. case <-time.After(refresh):
  331. // Timeout, gather a new set of stats
  332. }
  333. }
  334. if errc == nil {
  335. errc = <-db.quitChan
  336. }
  337. errc <- merr
  338. }
  339. func (db *LDBDatabase) NewBatch() Batch {
  340. return &ldbBatch{db: db.db, b: new(leveldb.Batch)}
  341. }
  342. type ldbBatch struct {
  343. db *leveldb.DB
  344. b *leveldb.Batch
  345. size int
  346. }
  347. func (b *ldbBatch) Put(key, value []byte) error {
  348. b.b.Put(key, value)
  349. b.size += len(value)
  350. return nil
  351. }
  352. func (b *ldbBatch) Write() error {
  353. return b.db.Write(b.b, nil)
  354. }
  355. func (b *ldbBatch) ValueSize() int {
  356. return b.size
  357. }
  358. func (b *ldbBatch) Reset() {
  359. b.b.Reset()
  360. b.size = 0
  361. }
  362. type table struct {
  363. db Database
  364. prefix string
  365. }
  366. // NewTable returns a Database object that prefixes all keys with a given
  367. // string.
  368. func NewTable(db Database, prefix string) Database {
  369. return &table{
  370. db: db,
  371. prefix: prefix,
  372. }
  373. }
  374. func (dt *table) Put(key []byte, value []byte) error {
  375. return dt.db.Put(append([]byte(dt.prefix), key...), value)
  376. }
  377. func (dt *table) Has(key []byte) (bool, error) {
  378. return dt.db.Has(append([]byte(dt.prefix), key...))
  379. }
  380. func (dt *table) Get(key []byte) ([]byte, error) {
  381. return dt.db.Get(append([]byte(dt.prefix), key...))
  382. }
  383. func (dt *table) Delete(key []byte) error {
  384. return dt.db.Delete(append([]byte(dt.prefix), key...))
  385. }
  386. func (dt *table) Close() {
  387. // Do nothing; don't close the underlying DB.
  388. }
  389. type tableBatch struct {
  390. batch Batch
  391. prefix string
  392. }
  393. // NewTableBatch returns a Batch object which prefixes all keys with a given string.
  394. func NewTableBatch(db Database, prefix string) Batch {
  395. return &tableBatch{db.NewBatch(), prefix}
  396. }
  397. func (dt *table) NewBatch() Batch {
  398. return &tableBatch{dt.db.NewBatch(), dt.prefix}
  399. }
  400. func (tb *tableBatch) Put(key, value []byte) error {
  401. return tb.batch.Put(append([]byte(tb.prefix), key...), value)
  402. }
  403. func (tb *tableBatch) Write() error {
  404. return tb.batch.Write()
  405. }
  406. func (tb *tableBatch) ValueSize() int {
  407. return tb.batch.ValueSize()
  408. }
  409. func (tb *tableBatch) Reset() {
  410. tb.batch.Reset()
  411. }