dataStore_bolt.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492
  1. //go:build !PSIPHON_USE_BADGER_DB && !PSIPHON_USE_FILES_DB
  2. // +build !PSIPHON_USE_BADGER_DB,!PSIPHON_USE_FILES_DB
  3. /*
  4. * Copyright (c) 2018, Psiphon Inc.
  5. * All rights reserved.
  6. *
  7. * This program is free software: you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License as published by
  9. * the Free Software Foundation, either version 3 of the License, or
  10. * (at your option) any later version.
  11. *
  12. * This program is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU General Public License
  18. * along with this program. If not, see <http://www.gnu.org/licenses/>.
  19. *
  20. */
  21. package psiphon
  22. import (
  23. std_errors "errors"
  24. "os"
  25. "path/filepath"
  26. "runtime/debug"
  27. "sync/atomic"
  28. "time"
  29. "github.com/Psiphon-Labs/bolt"
  30. "github.com/Psiphon-Labs/psiphon-tunnel-core/psiphon/common/errors"
  31. )
  32. const (
  33. OPEN_DB_RETRIES = 2
  34. )
  35. type datastoreDB struct {
  36. boltDB *bolt.DB
  37. isFailed int32
  38. }
  39. type datastoreTx struct {
  40. db *datastoreDB
  41. boltTx *bolt.Tx
  42. }
  43. type datastoreBucket struct {
  44. db *datastoreDB
  45. boltBucket *bolt.Bucket
  46. }
  47. type datastoreCursor struct {
  48. db *datastoreDB
  49. boltCursor *bolt.Cursor
  50. }
  51. func datastoreOpenDB(
  52. rootDataDirectory string, retryAndReset bool) (*datastoreDB, error) {
  53. var db *datastoreDB
  54. var err error
  55. attempts := 1
  56. if retryAndReset {
  57. attempts += OPEN_DB_RETRIES
  58. }
  59. reset := false
  60. for attempt := 0; attempt < attempts; attempt++ {
  61. db, err = tryDatastoreOpenDB(rootDataDirectory, reset)
  62. if err == nil {
  63. break
  64. }
  65. NoticeWarning("tryDatastoreOpenDB failed: %s", err)
  66. // The datastore file may be corrupt, so, in subsequent iterations,
  67. // set the "reset" flag and attempt to delete the file and try again.
  68. //
  69. // Don't reset the datastore when open failed due to timeout obtaining
  70. // the file lock, as the datastore is simply locked by another
  71. // process and not corrupt. As the file lock is advisory, deleting
  72. // the file would succeed despite the lock. In this case, still retry
  73. // in case the the lock is released.
  74. reset = !std_errors.Is(err, bolt.ErrTimeout)
  75. }
  76. return db, err
  77. }
  78. func tryDatastoreOpenDB(
  79. rootDataDirectory string, reset bool) (retdb *datastoreDB, reterr error) {
  80. // Testing indicates that the bolt Check function can raise SIGSEGV due to
  81. // invalid mmap buffer accesses in cases such as opening a valid but
  82. // truncated datastore file.
  83. //
  84. // To handle this, we temporarily set SetPanicOnFault in order to treat the
  85. // fault as a panic, recover any panic, and return an error which will result
  86. // in a retry with reset.
  87. // Begin recovery preamble
  88. panicOnFault := debug.SetPanicOnFault(true)
  89. defer debug.SetPanicOnFault(panicOnFault)
  90. defer func() {
  91. if r := recover(); r != nil {
  92. retdb = nil
  93. reterr = errors.Tracef("panic: %v", r)
  94. }
  95. }()
  96. // End recovery preamble
  97. filename := filepath.Join(rootDataDirectory, "psiphon.boltdb")
  98. if reset {
  99. NoticeWarning("tryDatastoreOpenDB: reset")
  100. os.Remove(filename)
  101. }
  102. newDB, err := bolt.Open(filename, 0600, &bolt.Options{Timeout: 1 * time.Second})
  103. if err != nil {
  104. return nil, errors.Trace(err)
  105. }
  106. // Run consistency checks on datastore and emit errors for diagnostics
  107. // purposes. We assume this will complete quickly for typical size Psiphon
  108. // datastores and wait for the check to complete before proceeding.
  109. err = newDB.View(func(tx *bolt.Tx) error {
  110. return tx.SynchronousCheck()
  111. })
  112. if err != nil {
  113. return nil, errors.Trace(err)
  114. }
  115. err = newDB.Update(func(tx *bolt.Tx) error {
  116. requiredBuckets := [][]byte{
  117. datastoreServerEntriesBucket,
  118. datastoreServerEntryTagsBucket,
  119. datastoreServerEntryTombstoneTagsBucket,
  120. datastoreUrlETagsBucket,
  121. datastoreKeyValueBucket,
  122. datastoreRemoteServerListStatsBucket,
  123. datastoreFailedTunnelStatsBucket,
  124. datastoreSLOKsBucket,
  125. datastoreTacticsBucket,
  126. datastoreSpeedTestSamplesBucket,
  127. datastoreDialParametersBucket,
  128. }
  129. for _, bucket := range requiredBuckets {
  130. _, err := tx.CreateBucketIfNotExists(bucket)
  131. if err != nil {
  132. return err
  133. }
  134. }
  135. return nil
  136. })
  137. if err != nil {
  138. return nil, errors.Trace(err)
  139. }
  140. // Cleanup obsolete buckets
  141. err = newDB.Update(func(tx *bolt.Tx) error {
  142. obsoleteBuckets := [][]byte{
  143. []byte("tunnelStats"),
  144. []byte("rankedServerEntries"),
  145. []byte("splitTunnelRouteETags"),
  146. []byte("splitTunnelRouteData"),
  147. }
  148. for _, obsoleteBucket := range obsoleteBuckets {
  149. if tx.Bucket(obsoleteBucket) != nil {
  150. err := tx.DeleteBucket(obsoleteBucket)
  151. if err != nil {
  152. NoticeWarning("DeleteBucket %s error: %s", obsoleteBucket, err)
  153. // Continue, since this is not fatal
  154. }
  155. }
  156. }
  157. return nil
  158. })
  159. if err != nil {
  160. return nil, errors.Trace(err)
  161. }
  162. return &datastoreDB{boltDB: newDB}, nil
  163. }
  164. var errDatastoreFailed = std_errors.New("datastore has failed")
  165. func (db *datastoreDB) isDatastoreFailed() bool {
  166. return atomic.LoadInt32(&db.isFailed) == 1
  167. }
  168. func (db *datastoreDB) setDatastoreFailed(r interface{}) {
  169. atomic.StoreInt32(&db.isFailed, 1)
  170. NoticeWarning("Datastore failed: %s", errors.Tracef("panic: %v", r))
  171. }
  172. func (db *datastoreDB) close() error {
  173. // Limitation: there is no panic recover in this case. We assume boltDB.Close
  174. // does not make mmap accesses and prefer to not continue with the datastore
  175. // file in a locked or open state. We also assume that any locks aquired by
  176. // boltDB.Close, held by transactions, will be released even if the
  177. // transaction panics and the database is in the failed state.
  178. return db.boltDB.Close()
  179. }
  180. func (db *datastoreDB) view(fn func(tx *datastoreTx) error) (reterr error) {
  181. // Any bolt function that performs mmap buffer accesses can raise SIGBUS due
  182. // to underlying storage changes, such as a truncation of the datastore file
  183. // or removal or network attached storage, etc.
  184. //
  185. // To handle this, we temporarily set SetPanicOnFault in order to treat the
  186. // fault as a panic, recover any panic to avoid crashing the process, and
  187. // putting this datastoreDB instance into a failed state. All subsequent
  188. // calls to this datastoreDBinstance or its related datastoreTx and
  189. // datastoreBucket instances will fail.
  190. // Begin recovery preamble
  191. if db.isDatastoreFailed() {
  192. return errDatastoreFailed
  193. }
  194. panicOnFault := debug.SetPanicOnFault(true)
  195. defer debug.SetPanicOnFault(panicOnFault)
  196. defer func() {
  197. if r := recover(); r != nil {
  198. db.setDatastoreFailed(r)
  199. reterr = errDatastoreFailed
  200. }
  201. }()
  202. // End recovery preamble
  203. return db.boltDB.View(
  204. func(tx *bolt.Tx) error {
  205. err := fn(&datastoreTx{db: db, boltTx: tx})
  206. if err != nil {
  207. return errors.Trace(err)
  208. }
  209. return nil
  210. })
  211. }
  212. func (db *datastoreDB) update(fn func(tx *datastoreTx) error) (reterr error) {
  213. // Begin recovery preamble
  214. if db.isDatastoreFailed() {
  215. return errDatastoreFailed
  216. }
  217. panicOnFault := debug.SetPanicOnFault(true)
  218. defer debug.SetPanicOnFault(panicOnFault)
  219. defer func() {
  220. if r := recover(); r != nil {
  221. db.setDatastoreFailed(r)
  222. reterr = errDatastoreFailed
  223. }
  224. }()
  225. // End recovery preamble
  226. return db.boltDB.Update(
  227. func(tx *bolt.Tx) error {
  228. err := fn(&datastoreTx{db: db, boltTx: tx})
  229. if err != nil {
  230. return errors.Trace(err)
  231. }
  232. return nil
  233. })
  234. }
  235. func (tx *datastoreTx) bucket(name []byte) (retbucket *datastoreBucket) {
  236. // Begin recovery preamble
  237. if tx.db.isDatastoreFailed() {
  238. return &datastoreBucket{db: tx.db, boltBucket: nil}
  239. }
  240. panicOnFault := debug.SetPanicOnFault(true)
  241. defer debug.SetPanicOnFault(panicOnFault)
  242. defer func() {
  243. if r := recover(); r != nil {
  244. tx.db.setDatastoreFailed(r)
  245. retbucket = &datastoreBucket{db: tx.db, boltBucket: nil}
  246. }
  247. }()
  248. // End recovery preamble
  249. return &datastoreBucket{db: tx.db, boltBucket: tx.boltTx.Bucket(name)}
  250. }
  251. func (tx *datastoreTx) clearBucket(name []byte) (reterr error) {
  252. // Begin recovery preamble
  253. if tx.db.isDatastoreFailed() {
  254. return errDatastoreFailed
  255. }
  256. panicOnFault := debug.SetPanicOnFault(true)
  257. defer debug.SetPanicOnFault(panicOnFault)
  258. defer func() {
  259. if r := recover(); r != nil {
  260. tx.db.setDatastoreFailed(r)
  261. reterr = errDatastoreFailed
  262. }
  263. }()
  264. // End recovery preamble
  265. err := tx.boltTx.DeleteBucket(name)
  266. if err != nil {
  267. return errors.Trace(err)
  268. }
  269. _, err = tx.boltTx.CreateBucket(name)
  270. if err != nil {
  271. return errors.Trace(err)
  272. }
  273. return nil
  274. }
  275. func (b *datastoreBucket) get(key []byte) (retvalue []byte) {
  276. // Begin recovery preamble
  277. if b.db.isDatastoreFailed() {
  278. return nil
  279. }
  280. panicOnFault := debug.SetPanicOnFault(true)
  281. defer debug.SetPanicOnFault(panicOnFault)
  282. defer func() {
  283. if r := recover(); r != nil {
  284. b.db.setDatastoreFailed(r)
  285. retvalue = nil
  286. }
  287. }()
  288. // End recovery preamble
  289. return b.boltBucket.Get(key)
  290. }
  291. func (b *datastoreBucket) put(key, value []byte) (reterr error) {
  292. // Begin recovery preamble
  293. if b.db.isDatastoreFailed() {
  294. return errDatastoreFailed
  295. }
  296. panicOnFault := debug.SetPanicOnFault(true)
  297. defer debug.SetPanicOnFault(panicOnFault)
  298. defer func() {
  299. if r := recover(); r != nil {
  300. b.db.setDatastoreFailed(r)
  301. reterr = errDatastoreFailed
  302. }
  303. }()
  304. // End recovery preamble
  305. err := b.boltBucket.Put(key, value)
  306. if err != nil {
  307. return errors.Trace(err)
  308. }
  309. return nil
  310. }
  311. func (b *datastoreBucket) delete(key []byte) (reterr error) {
  312. // Begin recovery preamble
  313. if b.db.isDatastoreFailed() {
  314. return errDatastoreFailed
  315. }
  316. panicOnFault := debug.SetPanicOnFault(true)
  317. defer debug.SetPanicOnFault(panicOnFault)
  318. defer func() {
  319. if r := recover(); r != nil {
  320. b.db.setDatastoreFailed(r)
  321. reterr = errDatastoreFailed
  322. }
  323. }()
  324. // End recovery preamble
  325. err := b.boltBucket.Delete(key)
  326. if err != nil {
  327. return errors.Trace(err)
  328. }
  329. return nil
  330. }
  331. func (b *datastoreBucket) cursor() (retcursor datastoreCursor) {
  332. // Begin recovery preamble
  333. if b.db.isDatastoreFailed() {
  334. return datastoreCursor{db: b.db, boltCursor: nil}
  335. }
  336. panicOnFault := debug.SetPanicOnFault(true)
  337. defer debug.SetPanicOnFault(panicOnFault)
  338. defer func() {
  339. if r := recover(); r != nil {
  340. b.db.setDatastoreFailed(r)
  341. retcursor = datastoreCursor{db: b.db, boltCursor: nil}
  342. }
  343. }()
  344. // End recovery preamble
  345. return datastoreCursor{db: b.db, boltCursor: b.boltBucket.Cursor()}
  346. }
  347. func (c *datastoreCursor) firstKey() (retkey []byte) {
  348. // Begin recovery preamble
  349. if c.db.isDatastoreFailed() {
  350. return nil
  351. }
  352. panicOnFault := debug.SetPanicOnFault(true)
  353. defer debug.SetPanicOnFault(panicOnFault)
  354. defer func() {
  355. if r := recover(); r != nil {
  356. c.db.setDatastoreFailed(r)
  357. retkey = nil
  358. }
  359. }()
  360. // End recovery preamble
  361. key, _ := c.boltCursor.First()
  362. return key
  363. }
  364. func (c *datastoreCursor) nextKey() (retkey []byte) {
  365. // Begin recovery preamble
  366. if c.db.isDatastoreFailed() {
  367. return nil
  368. }
  369. panicOnFault := debug.SetPanicOnFault(true)
  370. defer debug.SetPanicOnFault(panicOnFault)
  371. defer func() {
  372. if r := recover(); r != nil {
  373. c.db.setDatastoreFailed(r)
  374. retkey = nil
  375. }
  376. }()
  377. // End recovery preamble
  378. key, _ := c.boltCursor.Next()
  379. return key
  380. }
  381. func (c *datastoreCursor) first() (retkey, retvalue []byte) {
  382. // Begin recovery preamble
  383. if c.db.isDatastoreFailed() {
  384. return nil, nil
  385. }
  386. panicOnFault := debug.SetPanicOnFault(true)
  387. defer debug.SetPanicOnFault(panicOnFault)
  388. defer func() {
  389. if r := recover(); r != nil {
  390. c.db.setDatastoreFailed(r)
  391. retkey = nil
  392. retvalue = nil
  393. }
  394. }()
  395. // End recovery preamble
  396. return c.boltCursor.First()
  397. }
  398. func (c *datastoreCursor) next() (retkey, retvalue []byte) {
  399. // Begin recovery preamble
  400. if c.db.isDatastoreFailed() {
  401. return nil, nil
  402. }
  403. panicOnFault := debug.SetPanicOnFault(true)
  404. defer debug.SetPanicOnFault(panicOnFault)
  405. defer func() {
  406. if r := recover(); r != nil {
  407. c.db.setDatastoreFailed(r)
  408. retkey = nil
  409. retvalue = nil
  410. }
  411. }()
  412. // End recovery preamble
  413. return c.boltCursor.Next()
  414. }
  415. func (c *datastoreCursor) close() {
  416. // BoltDB doesn't close cursors.
  417. }