Compare commits

...

6 Commits

Author SHA1 Message Date
James Mills
2400dd86d5 Add docs for bitcask 2019-03-21 17:46:53 +10:00
James Mills
27eb922ba2 Add docs for options 2019-03-21 17:20:53 +10:00
James Mills
34ad78efc0 Add KeYS command to server (bitraftd) 2019-03-21 10:49:53 +10:00
James Mills
352c32ee12 Add Len() to exported API (extended API) 2019-03-21 10:47:50 +10:00
James Mills
aaea7273c3 Add Keys() to exported API (extended API) 2019-03-21 10:41:56 +10:00
James Mills
01cb269a51 Add EXISTS command to server (bitraftd) 2019-03-21 10:29:18 +10:00
5 changed files with 115 additions and 36 deletions

View File

@@ -16,13 +16,29 @@ import (
) )
var ( var (
ErrKeyNotFound = errors.New("error: key not found") // ErrKeyNotFound is the error returned when a key is not found
ErrKeyTooLarge = errors.New("error: key too large") ErrKeyNotFound = errors.New("error: key not found")
ErrValueTooLarge = errors.New("error: value too large")
// ErrKeyTooLarge is the error returned for a key that exceeds the
// maximum allowed key size (configured with WithMaxKeySize).
ErrKeyTooLarge = errors.New("error: key too large")
// ErrValueTooLarge is the error returned for a value that exceeds the
// maximum allowed value size (configured with WithMaxValueSize).
ErrValueTooLarge = errors.New("error: value too large")
// ErrChecksumFailed is the error returned if a key/value retrieved does
// not match its CRC checksum
ErrChecksumFailed = errors.New("error: checksum failed") ErrChecksumFailed = errors.New("error: checksum failed")
// ErrDatabaseLocked is the error returned if the database is locked
// (typically opened by another process)
ErrDatabaseLocked = errors.New("error: database locked") ErrDatabaseLocked = errors.New("error: database locked")
) )
// Bitcask is a struct that represents an on-disk LSM and WAL data structure
// and in-memory hash of key/value pairs as per the Bitcask paper and seen
// in the Riak database.
type Bitcask struct { type Bitcask struct {
*flock.Flock *flock.Flock
@@ -32,10 +48,11 @@ type Bitcask struct {
keydir *internal.Keydir keydir *internal.Keydir
datafiles []*internal.Datafile datafiles []*internal.Datafile
trie *trie.Trie trie *trie.Trie
maxDatafileSize int64
} }
// Close closes the database and removes the lock. It is important to call
// Close() as this is the only way to clean up the lock held by the open
// database.
func (b *Bitcask) Close() error { func (b *Bitcask) Close() error {
defer func() { defer func() {
b.Flock.Unlock() b.Flock.Unlock()
@@ -48,10 +65,13 @@ func (b *Bitcask) Close() error {
return b.curr.Close() return b.curr.Close()
} }
// Sync flushes all buffers to disk ensuring all data is written
func (b *Bitcask) Sync() error { func (b *Bitcask) Sync() error {
return b.curr.Sync() return b.curr.Sync()
} }
// Get retrieves the value of the given key. If the key is not found or an I/O
// error occurs a null byte slice is returned along with the error.
func (b *Bitcask) Get(key string) ([]byte, error) { func (b *Bitcask) Get(key string) ([]byte, error) {
var df *internal.Datafile var df *internal.Datafile
@@ -79,16 +99,18 @@ func (b *Bitcask) Get(key string) ([]byte, error) {
return e.Value, nil return e.Value, nil
} }
// Has returns true if the key exists in the database, false otherwise.
func (b *Bitcask) Has(key string) bool { func (b *Bitcask) Has(key string) bool {
_, ok := b.keydir.Get(key) _, ok := b.keydir.Get(key)
return ok return ok
} }
// Put stores the key and value in the database.
func (b *Bitcask) Put(key string, value []byte) error { func (b *Bitcask) Put(key string, value []byte) error {
if len(key) > b.config.MaxKeySize { if len(key) > b.config.maxKeySize {
return ErrKeyTooLarge return ErrKeyTooLarge
} }
if len(value) > b.config.MaxValueSize { if len(value) > b.config.maxValueSize {
return ErrValueTooLarge return ErrValueTooLarge
} }
@@ -103,6 +125,8 @@ func (b *Bitcask) Put(key string, value []byte) error {
return nil return nil
} }
// Delete deletes the named key. If the key doesn't exist or an I/O error
// occurs the error is returned.
func (b *Bitcask) Delete(key string) error { func (b *Bitcask) Delete(key string) error {
_, err := b.put(key, []byte{}) _, err := b.put(key, []byte{})
if err != nil { if err != nil {
@@ -115,6 +139,9 @@ func (b *Bitcask) Delete(key string) error {
return nil return nil
} }
// Scan performs a prefix scan of keys matching the given prefix, calling
// the function `f` with the keys found. If the function returns an error
// no further keys are processed and the first error is returned.
func (b *Bitcask) Scan(prefix string, f func(key string) error) error { func (b *Bitcask) Scan(prefix string, f func(key string) error) error {
keys := b.trie.PrefixSearch(prefix) keys := b.trie.PrefixSearch(prefix)
for _, key := range keys { for _, key := range keys {
@@ -125,6 +152,19 @@ func (b *Bitcask) Scan(prefix string, f func(key string) error) error {
return nil return nil
} }
// Len returns the total number of keys in the database
func (b *Bitcask) Len() int {
return b.keydir.Len()
}
// Keys returns all keys in the database as a channel of string(s)
func (b *Bitcask) Keys() chan string {
return b.keydir.Keys()
}
// Fold iterates over all keys in the database calling the function `f` for
// each key. If the function returns an error, no further keys are processed
// and the error is returned.
func (b *Bitcask) Fold(f func(key string) error) error { func (b *Bitcask) Fold(f func(key string) error) error {
for key := range b.keydir.Keys() { for key := range b.keydir.Keys() {
if err := f(key); err != nil { if err := f(key); err != nil {
@@ -140,7 +180,7 @@ func (b *Bitcask) put(key string, value []byte) (int64, error) {
return -1, err return -1, err
} }
if size >= b.maxDatafileSize { if size >= int64(b.config.maxDatafileSize) {
err := b.curr.Close() err := b.curr.Close()
if err != nil { if err != nil {
return -1, err return -1, err
@@ -165,11 +205,9 @@ func (b *Bitcask) put(key string, value []byte) (int64, error) {
return b.curr.Write(e) return b.curr.Write(e)
} }
func (b *Bitcask) setMaxDatafileSize(size int64) error { // Merge merges all datafiles in the database creating hint files for faster
b.maxDatafileSize = size // startup. Old keys are squashed and deleted keys removed. Call this function
return nil // periodically to reclaim disk space.
}
func Merge(path string, force bool) error { func Merge(path string, force bool) error {
fns, err := internal.GetDatafiles(path) fns, err := internal.GetDatafiles(path)
if err != nil { if err != nil {
@@ -276,7 +314,10 @@ func Merge(path string, force bool) error {
return nil return nil
} }
func Open(path string, options ...option) (*Bitcask, error) { // Open opens the database at the given path with optional options.
// Options can be provided with the `WithXXX` functions that provide
// configuration options as functions.
func Open(path string, options ...Option) (*Bitcask, error) {
if err := os.MkdirAll(path, 0755); err != nil { if err := os.MkdirAll(path, 0755); err != nil {
return nil, err return nil, err
} }
@@ -365,8 +406,6 @@ func Open(path string, options ...option) (*Bitcask, error) {
keydir: keydir, keydir: keydir,
datafiles: datafiles, datafiles: datafiles,
trie: trie, trie: trie,
maxDatafileSize: DefaultMaxDatafileSize,
} }
for _, opt := range options { for _, opt := range options {

View File

@@ -40,10 +40,22 @@ func TestAll(t *testing.T) {
assert.Equal([]byte("bar"), val) assert.Equal([]byte("bar"), val)
}) })
t.Run("Len", func(t *testing.T) {
assert.Equal(1, db.Len())
})
t.Run("Has", func(t *testing.T) { t.Run("Has", func(t *testing.T) {
assert.True(db.Has("foo")) assert.True(db.Has("foo"))
}) })
t.Run("Keys", func(t *testing.T) {
keys := make([]string, 0)
for key := range db.Keys() {
keys = append(keys, key)
}
assert.Equal([]string{"foo"}, keys)
})
t.Run("Fold", func(t *testing.T) { t.Run("Fold", func(t *testing.T) {
var ( var (
keys []string keys []string

View File

@@ -96,6 +96,22 @@ func main() {
} else { } else {
conn.WriteBulk(value) conn.WriteBulk(value)
} }
case "keys":
conn.WriteArray(db.Len())
for key := range db.Keys() {
conn.WriteBulk([]byte(key))
}
case "exists":
if len(cmd.Args) != 2 {
conn.WriteError("ERR wrong number of arguments for '" + string(cmd.Args[0]) + "' command")
return
}
key := string(cmd.Args[1])
if db.Has(key) {
conn.WriteInt(1)
} else {
conn.WriteInt(0)
}
case "del": case "del":
if len(cmd.Args) != 2 { if len(cmd.Args) != 2 {
conn.WriteError("ERR wrong number of arguments for '" + string(cmd.Args[0]) + "' command") conn.WriteError("ERR wrong number of arguments for '" + string(cmd.Args[0]) + "' command")

View File

@@ -52,11 +52,17 @@ func (k *Keydir) Delete(key string) {
delete(k.kv, key) delete(k.kv, key)
} }
func (k *Keydir) Len() int {
return len(k.kv)
}
func (k *Keydir) Keys() chan string { func (k *Keydir) Keys() chan string {
ch := make(chan string) ch := make(chan string)
go func() { go func() {
for k := range k.kv { k.RLock()
ch <- k defer k.RUnlock()
for key := range k.kv {
ch <- key
} }
close(ch) close(ch)
}() }()

View File

@@ -1,47 +1,53 @@
package bitcask package bitcask
const ( const (
// DefaultMaxDatafileSize is the default maximum datafile size in bytes
DefaultMaxDatafileSize = 1 << 20 // 1MB DefaultMaxDatafileSize = 1 << 20 // 1MB
DefaultMaxKeySize = 64 // 64 bytes
DefaultMaxValueSize = 1 << 16 // 65KB // DefaultMaxKeySize is the default maximum key size in bytes
DefaultMaxKeySize = 64 // 64 bytes
// DefaultMaxValueSize is the default maximum value size in bytes
DefaultMaxValueSize = 1 << 16 // 65KB
) )
// Option ... // Option is a function that takes a config struct and modifies it
type Option option type Option func(*config) error
type option func(*config) error
type config struct { type config struct {
MaxDatafileSize int maxDatafileSize int
MaxKeySize int maxKeySize int
MaxValueSize int maxValueSize int
} }
func newDefaultConfig() *config { func newDefaultConfig() *config {
return &config{ return &config{
MaxDatafileSize: DefaultMaxDatafileSize, maxDatafileSize: DefaultMaxDatafileSize,
MaxKeySize: DefaultMaxKeySize, maxKeySize: DefaultMaxKeySize,
MaxValueSize: DefaultMaxValueSize, maxValueSize: DefaultMaxValueSize,
} }
} }
func WithMaxDatafileSize(size int) option { // WithMaxDatafileSize sets the maximum datafile size option
func WithMaxDatafileSize(size int) Option {
return func(cfg *config) error { return func(cfg *config) error {
cfg.MaxDatafileSize = size cfg.maxDatafileSize = size
return nil return nil
} }
} }
func WithMaxKeySize(size int) option { // WithMaxKeySize sets the maximum key size option
func WithMaxKeySize(size int) Option {
return func(cfg *config) error { return func(cfg *config) error {
cfg.MaxKeySize = size cfg.maxKeySize = size
return nil return nil
} }
} }
func WithMaxValueSize(size int) option { // WithMaxValueSize sets the maximum value size option
func WithMaxValueSize(size int) Option {
return func(cfg *config) error { return func(cfg *config) error {
cfg.MaxValueSize = size cfg.maxValueSize = size
return nil return nil
} }
} }