cockroachdb
diff --git a/‎storage/command_queue.go‎
Lines changed: 131 additions & 0 deletions b/‎storage/command_queue.go‎
Lines changed: 131 additions & 0 deletions
diff --git a/‎storage/command_queue_test.go‎
Lines changed: 167 additions & 0 deletions b/‎storage/command_queue_test.go‎
Lines changed: 167 additions & 0 deletions
diff --git a/‎storage/engine/in_mem.go‎
Lines changed: 1 addition & 1 deletion b/‎storage/engine/in_mem.go‎
Lines changed: 1 addition & 1 deletion
@@ -0,0 +1,131 @@
+// Copyright 2014 The Cockroach Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+// implied. See the License for the specific language governing
+// permissions and limitations under the License. See the AUTHORS file
+// for names of contributors.
+//
+// Author: Spencer Kimball (spencer.kimball@gmail.com)
+
+package storage
+
+import (
+	"sync"
+
+	"github.com/cockroachdb/cockroach/storage/engine"
+	"github.com/cockroachdb/cockroach/util"
+)
+
+// A CommandQueue maintains an interval tree of keys or key ranges for
+// executing commands. New commands affecting keys or key ranges must
+// wait on already-executing commands which overlap their key range.
+//
+// Before executing, a command invokes GetWait() to initialize a
+// WaitGroup with the number of overlapping commands which are already
+// running. The wait group is waited on by the caller for confirmation
+// that all overlapping, pending commands have completed and the
+// pending command can proceed.
+//
+// After waiting, a command is added to the queue's already-executing
+// set via Add(). Add accepts a parameter indicating whether the
+// command is read-only. Read-only commands don't need to wait on
+// other read-only commands, so the wait group returned via GetWait()
+// doesn't include read-only on read-only overlapping commands as an
+// optimization.
+//
+// Once commands complete, Remove() is invoked to remove the executing
+// command and decrement the counts on any pending WaitGroups,
+// possibly signaling waiting commands who were gated by the executing
+// command's affected key(s).
+//
+// CommandQueue is not thread safe.
+type CommandQueue struct {
+	cache *util.IntervalCache // Executing commands, keyed by the key range each one affects
+}
+
+type cmd struct {
+	readOnly bool              // True if the command only reads; GetWait does not gate reads on reads
+	pending  []*sync.WaitGroup // Pending commands gated on cmd; onEvicted calls Done() on each
+}
+
+// NewCommandQueue builds an empty command queue. The backing interval
+// cache is configured with the CacheNone policy, and the queue's
+// onEvicted method is registered as the cache's eviction callback so
+// that waiters are signaled whenever an entry is removed.
+func NewCommandQueue() *CommandQueue {
+	cache := util.NewIntervalCache(util.CacheConfig{Policy: util.CacheNone})
+	cq := &CommandQueue{cache: cache}
+	cache.OnEvicted = cq.onEvicted
+	return cq
+}
+
+// onEvicted is the eviction callback registered with the interval
+// cache; it runs for each entry removed by Remove() or Clear(). The
+// evicted value is the *cmd stored by Add(), and every WaitGroup that
+// was gated on it is decremented once.
+func (cq *CommandQueue) onEvicted(key, value interface{}) {
+	evicted := value.(*cmd)
+	for i := range evicted.pending {
+		evicted.pending[i].Done()
+	}
+}
+
+// GetWait increments the supplied wait group once for every executing
+// command which overlaps the key range [start, end) and which the
+// requester must wait for. If end is nil, engine.NextKey(start) is
+// used as the end so that the request covers the single key start.
+// The wait group is also recorded on each gating command so that it
+// is decremented when that command is removed from the queue. The
+// caller should call wg.Wait() to block until all gating commands
+// have completed or failed.
+//
+// readOnly is true if the requester is a read-only command and false
+// for read-write. A read-only requester is not gated on executing
+// read-only commands.
+func (cq *CommandQueue) GetWait(start, end engine.Key, readOnly bool, wg *sync.WaitGroup) {
+	if end == nil {
+		end = engine.NextKey(start)
+	}
+	overlaps := cq.cache.GetOverlaps(rangeKey(start), rangeKey(end))
+	for _, o := range overlaps {
+		executing := o.(*cmd)
+		if readOnly && executing.readOnly {
+			// Reads never gate other reads.
+			continue
+		}
+		executing.pending = append(executing.pending, wg)
+		wg.Add(1)
+	}
+}
+
+// Add registers a command as executing over the key range
+// [start, end). If end is nil, engine.NextKey(start) is used as the
+// end so that the command covers the single key start. readOnly
+// records whether the command only reads. The returned interface is
+// the command's key in the queue and must be passed back to Remove()
+// once the command completes.
+//
+// Add should be invoked only after the caller has waited on the
+// WaitGroup initialized through GetWait(), i.e. after all
+// already-executing, overlapping commands have finished.
+func (cq *CommandQueue) Add(start, end engine.Key, readOnly bool) interface{} {
+	if end == nil {
+		end = engine.NextKey(start)
+	}
+	executing := &cmd{readOnly: readOnly}
+	key := cq.cache.NewKey(rangeKey(start), rangeKey(end))
+	cq.cache.Add(key, executing)
+	return key
+}
+
+// Remove signals that the command identified by key -- the value
+// returned by Add() -- has completed, and deletes it from the queue.
+// Each WaitGroup gated on the command is decremented via onEvicted,
+// releasing any pending command that was waiting only on this one.
+//
+// Remove is invoked after a mutating command has been committed to
+// the Raft log and applied to the underlying state machine. Similarly,
+// Remove is invoked after a read-only command has been executed
+// against the underlying state machine.
+func (cq *CommandQueue) Remove(key interface{}) {
+	cq.cache.Del(key)
+}
+
+// Clear removes all executing commands at once, signaling every waiting command.
+func (cq *CommandQueue) Clear() {
+	cq.cache.Clear() // Each removed entry is passed to onEvicted
+}
@@ -0,0 +1,167 @@
+// Copyright 2014 The Cockroach Authors.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+// implied. See the License for the specific language governing
+// permissions and limitations under the License. See the AUTHORS file
+// for names of contributors.
+//
+// Author: Spencer Kimball (spencer.kimball@gmail.com)
+
+package storage
+
+import (
+	"sync"
+	"testing"
+	"time"
+
+	"github.com/cockroachdb/cockroach/storage/engine"
+)
+
+// waitForCmd blocks on the supplied WaitGroup in a background
+// goroutine. The returned channel is closed as soon as that wait
+// returns, letting the caller observe completion without blocking.
+func waitForCmd(wg *sync.WaitGroup) <-chan struct{} {
+	done := make(chan struct{})
+	go func(signal chan<- struct{}) {
+		wg.Wait()
+		close(signal)
+	}(done)
+	return done
+}
+
+// testCmdDone reports whether the cmdDone channel is closed within
+// the given wait duration: true if the command finished in time,
+// false if the timeout fired first.
+func testCmdDone(cmdDone <-chan struct{}, wait time.Duration) bool {
+	timeout := time.After(wait)
+	select {
+	case <-timeout:
+		return false
+	case <-cmdDone:
+		return true
+	}
+}
+
+func TestCommandQueue(t *testing.T) {
+	cq := NewCommandQueue()
+	wg := sync.WaitGroup{}
+
+	// Try a command with no overlapping already-running commands.
+	cq.GetWait(engine.Key("a"), nil, false, &wg)
+	wg.Wait()
+	cq.GetWait(engine.Key("a"), engine.Key("b"), false, &wg)
+	wg.Wait()
+
+	// Add a command and verify wait group is returned.
+	wk := cq.Add(engine.Key("a"), nil, false)
+	cq.GetWait(engine.Key("a"), nil, false, &wg)
+	cmdDone := waitForCmd(&wg)
+	if testCmdDone(cmdDone, 1*time.Millisecond) {
+		t.Fatal("command should not finish with command outstanding")
+	}
+	cq.Remove(wk)
+	if !testCmdDone(cmdDone, 5*time.Millisecond) {
+		t.Fatal("command should finish with no commands outstanding")
+	}
+}
+
+func TestCommandQueueNoWaitOnReadOnly(t *testing.T) {
+	cq := NewCommandQueue()
+	wg := sync.WaitGroup{}
+	// Add a read-only command.
+	wk := cq.Add(engine.Key("a"), nil, true)
+	// Verify no wait on another read-only command.
+	cq.GetWait(engine.Key("a"), nil, true, &wg)
+	wg.Wait()
+	// Verify wait with a read-write command.
+	cq.GetWait(engine.Key("a"), nil, false, &wg)
+	cmdDone := waitForCmd(&wg)
+	if testCmdDone(cmdDone, 1*time.Millisecond) {
+		t.Fatal("command should not finish with command outstanding")
+	}
+	cq.Remove(wk)
+	if !testCmdDone(cmdDone, 5*time.Millisecond) {
+		t.Fatal("command should finish with no commands outstanding")
+	}
+}
+
+func TestCommandQueueMultipleExecutingCommands(t *testing.T) {
+	cq := NewCommandQueue()
+	wg := sync.WaitGroup{}
+
+	// Add multiple commands and add a command which overlaps them all.
+	wk1 := cq.Add(engine.Key("a"), nil, false)
+	wk2 := cq.Add(engine.Key("b"), engine.Key("c"), false)
+	wk3 := cq.Add(engine.Key("0"), engine.Key("d"), false)
+	cq.GetWait(engine.Key("a"), engine.Key("cc"), false, &wg)
+	cmdDone := waitForCmd(&wg)
+	cq.Remove(wk1)
+	if testCmdDone(cmdDone, 1*time.Millisecond) {
+		t.Fatal("command should not finish with two commands outstanding")
+	}
+	cq.Remove(wk2)
+	if testCmdDone(cmdDone, 1*time.Millisecond) {
+		t.Fatal("command should not finish with one command outstanding")
+	}
+	cq.Remove(wk3)
+	if !testCmdDone(cmdDone, 5*time.Millisecond) {
+		t.Fatal("command should finish with no commands outstanding")
+	}
+}
+
+func TestCommandQueueMultiplePendingCommands(t *testing.T) {
+	cq := NewCommandQueue()
+	wg1 := sync.WaitGroup{}
+	wg2 := sync.WaitGroup{}
+	wg3 := sync.WaitGroup{}
+
+	// Add a command which will overlap all commands.
+	wk := cq.Add(engine.Key("a"), engine.Key("d"), false)
+	cq.GetWait(engine.Key("a"), nil, false, &wg1)
+	cq.GetWait(engine.Key("b"), nil, false, &wg2)
+	cq.GetWait(engine.Key("c"), nil, false, &wg3)
+	cmdDone1 := waitForCmd(&wg1)
+	cmdDone2 := waitForCmd(&wg2)
+	cmdDone3 := waitForCmd(&wg3)
+
+	if testCmdDone(cmdDone1, 1*time.Millisecond) ||
+		testCmdDone(cmdDone2, 1*time.Millisecond) ||
+		testCmdDone(cmdDone3, 1*time.Millisecond) {
+		t.Fatal("no commands should finish with command outstanding")
+	}
+	cq.Remove(wk)
+	if !testCmdDone(cmdDone1, 5*time.Millisecond) ||
+		!testCmdDone(cmdDone2, 5*time.Millisecond) ||
+		!testCmdDone(cmdDone3, 5*time.Millisecond) {
+		t.Fatal("commands should finish with no commands outstanding")
+	}
+}
+
+// TestCommandQueueClear verifies that Clear() signals every command
+// waiting on any of the executing commands.
+func TestCommandQueueClear(t *testing.T) {
+	cq := NewCommandQueue()
+	wg1 := sync.WaitGroup{}
+	wg2 := sync.WaitGroup{}
+
+	// Add multiple commands and commands which access each.
+	cq.Add(engine.Key("a"), nil, false)
+	cq.Add(engine.Key("b"), nil, false)
+	cq.GetWait(engine.Key("a"), nil, false, &wg1)
+	cq.GetWait(engine.Key("b"), nil, false, &wg2)
+	cmdDone1 := waitForCmd(&wg1)
+	cmdDone2 := waitForCmd(&wg2)
+
+	// Clear the queue and verify both commands are signaled.
+	cq.Clear()
+
+	// Allow the same 5ms the other tests in this file use when
+	// expecting completion: the waiter goroutines still have to be
+	// scheduled after Clear() returns, so 1ms is needlessly tight.
+	if !testCmdDone(cmdDone1, 5*time.Millisecond) ||
+		!testCmdDone(cmdDone2, 5*time.Millisecond) {
+		t.Fatal("commands should finish when clearing queue")
+	}
+}
@@ -127,7 +127,7 @@ func (in *InMem) Put(key Key, value []byte) error {
 	return in.putLocked(key, value)
 }
 
-// putLocked assumes mutex is already held by caller. See put().
+// putLocked assumes mutex is already held by caller. See Put().
 func (in *InMem) putLocked(key Key, value []byte) error {
 	if len(key) == 0 {
 		return emptyKeyError()
Original file line number	Diff line number	Diff line change
`@@ -127,7 +127,7 @@ func (in *InMem) Put(key Key, value []byte) error {`
`127`	`127`	`return in.putLocked(key, value)`
`128`	`128`	`}`
`129`	`129`
`130`		`-// putLocked assumes mutex is already held by caller. See put().`
	`130`	`+// putLocked assumes mutex is already held by caller. See Put().`
`131`	`131`	`func (in *InMem) putLocked(key Key, value []byte) error {`
`132`	`132`	`if len(key) == 0 {`
`133`	`133`	`return emptyKeyError()`