Streamline error handling and locking, with fix for close() race

This commit is contained in:
Jakob Borg 2014-05-04 17:40:40 +02:00
parent 10e8861f14
commit 482795bab0
1 changed file with 118 additions and 120 deletions

View File

@ -64,24 +64,24 @@ type Connection interface {
} }
type rawConnection struct { type rawConnection struct {
sync.RWMutex id string
receiver Model
reader io.ReadCloser
cr *countingReader
xr *xdr.Reader
writer io.WriteCloser
cw *countingWriter
wb *bufio.Writer
xw *xdr.Writer
wmut sync.Mutex
closed bool
id string
receiver Model
reader io.ReadCloser
cr *countingReader
xr *xdr.Reader
writer io.WriteCloser
cw *countingWriter
wb *bufio.Writer
xw *xdr.Writer
closed chan struct{}
awaiting map[int]chan asyncResult awaiting map[int]chan asyncResult
nextID int nextID int
indexSent map[string]map[string][2]int64 indexSent map[string]map[string][2]int64
imut sync.Mutex
hasSentIndex bool
hasRecvdIndex bool
} }
type asyncResult struct { type asyncResult struct {
@ -115,7 +115,6 @@ func NewConnection(nodeID string, reader io.Reader, writer io.Writer, receiver M
cw: cw, cw: cw,
wb: wb, wb: wb,
xw: xdr.NewWriter(wb), xw: xdr.NewWriter(wb),
closed: make(chan struct{}),
awaiting: make(map[int]chan asyncResult), awaiting: make(map[int]chan asyncResult),
indexSent: make(map[string]map[string][2]int64), indexSent: make(map[string]map[string][2]int64),
} }
@ -132,11 +131,11 @@ func (c *rawConnection) ID() string {
// Index writes the list of file information to the connected peer node // Index writes the list of file information to the connected peer node
func (c *rawConnection) Index(repo string, idx []FileInfo) { func (c *rawConnection) Index(repo string, idx []FileInfo) {
c.Lock()
if c.isClosed() { if c.isClosed() {
c.Unlock()
return return
} }
c.imut.Lock()
var msgType int var msgType int
if c.indexSent[repo] == nil { if c.indexSent[repo] == nil {
// This is the first time we send an index. // This is the first time we send an index.
@ -159,14 +158,15 @@ func (c *rawConnection) Index(repo string, idx []FileInfo) {
idx = diff idx = diff
} }
header{0, c.nextID, msgType}.encodeXDR(c.xw) id := c.nextID
_, err := IndexMessage{repo, idx}.encodeXDR(c.xw)
if err == nil {
err = c.flush()
}
c.nextID = (c.nextID + 1) & 0xfff c.nextID = (c.nextID + 1) & 0xfff
c.hasSentIndex = true c.imut.Unlock()
c.Unlock()
c.wmut.Lock()
header{0, id, msgType}.encodeXDR(c.xw)
IndexMessage{repo, idx}.encodeXDR(c.xw)
err := c.flush()
c.wmut.Unlock()
if err != nil { if err != nil {
c.close(err) c.close(err)
@ -176,28 +176,30 @@ func (c *rawConnection) Index(repo string, idx []FileInfo) {
// Request returns the bytes for the specified block after fetching them from the connected peer. // Request returns the bytes for the specified block after fetching them from the connected peer.
func (c *rawConnection) Request(repo string, name string, offset int64, size int) ([]byte, error) { func (c *rawConnection) Request(repo string, name string, offset int64, size int) ([]byte, error) {
c.Lock()
if c.isClosed() { if c.isClosed() {
c.Unlock()
return nil, ErrClosed return nil, ErrClosed
} }
c.imut.Lock()
id := c.nextID
c.nextID = (c.nextID + 1) & 0xfff
rc := make(chan asyncResult) rc := make(chan asyncResult)
if _, ok := c.awaiting[c.nextID]; ok { if _, ok := c.awaiting[id]; ok {
panic("id taken") panic("id taken")
} }
c.awaiting[c.nextID] = rc c.awaiting[id] = rc
header{0, c.nextID, messageTypeRequest}.encodeXDR(c.xw) c.imut.Unlock()
_, err := RequestMessage{repo, name, uint64(offset), uint32(size)}.encodeXDR(c.xw)
if err == nil { c.wmut.Lock()
err = c.flush() header{0, id, messageTypeRequest}.encodeXDR(c.xw)
} RequestMessage{repo, name, uint64(offset), uint32(size)}.encodeXDR(c.xw)
err := c.flush()
c.wmut.Unlock()
if err != nil { if err != nil {
c.Unlock()
c.close(err) c.close(err)
return nil, err return nil, err
} }
c.nextID = (c.nextID + 1) & 0xfff
c.Unlock()
res, ok := <-rc res, ok := <-rc
if !ok { if !ok {
@ -208,46 +210,47 @@ func (c *rawConnection) Request(repo string, name string, offset int64, size int
// ClusterConfig sends the cluster configuration message to the peer and closes the connection on error // ClusterConfig sends the cluster configuration message to the peer and closes the connection on error
func (c *rawConnection) ClusterConfig(config ClusterConfigMessage) { func (c *rawConnection) ClusterConfig(config ClusterConfigMessage) {
c.Lock()
defer c.Unlock()
if c.isClosed() { if c.isClosed() {
return return
} }
header{0, c.nextID, messageTypeClusterConfig}.encodeXDR(c.xw) c.imut.Lock()
id := c.nextID
c.nextID = (c.nextID + 1) & 0xfff c.nextID = (c.nextID + 1) & 0xfff
c.imut.Unlock()
c.wmut.Lock()
header{0, id, messageTypeClusterConfig}.encodeXDR(c.xw)
config.encodeXDR(c.xw)
err := c.flush()
c.wmut.Unlock()
_, err := config.encodeXDR(c.xw)
if err == nil {
err = c.flush()
}
if err != nil { if err != nil {
c.close(err) c.close(err)
} }
} }
func (c *rawConnection) ping() bool { func (c *rawConnection) ping() bool {
c.Lock()
if c.isClosed() { if c.isClosed() {
c.Unlock()
return false return false
} }
c.imut.Lock()
id := c.nextID
c.nextID = (c.nextID + 1) & 0xfff
rc := make(chan asyncResult, 1) rc := make(chan asyncResult, 1)
c.awaiting[c.nextID] = rc c.awaiting[id] = rc
header{0, c.nextID, messageTypePing}.encodeXDR(c.xw) c.imut.Unlock()
c.wmut.Lock()
header{0, id, messageTypePing}.encodeXDR(c.xw)
err := c.flush() err := c.flush()
c.wmut.Unlock()
if err != nil { if err != nil {
c.Unlock()
c.close(err) c.close(err)
return false return false
} else if c.xw.Error() != nil {
c.Unlock()
c.close(c.xw.Error())
return false
} }
c.nextID = (c.nextID + 1) & 0xfff
c.Unlock()
res, ok := <-rc res, ok := <-rc
return ok && res.err == nil return ok && res.err == nil
@ -258,40 +261,47 @@ type flusher interface {
} }
func (c *rawConnection) flush() error { func (c *rawConnection) flush() error {
c.wb.Flush() if err := c.xw.Error(); err != nil {
return err
}
if err := c.wb.Flush(); err != nil {
return err
}
if f, ok := c.writer.(flusher); ok { if f, ok := c.writer.(flusher); ok {
return f.Flush() return f.Flush()
} }
return nil return nil
} }
func (c *rawConnection) close(err error) { func (c *rawConnection) close(err error) {
c.Lock() c.imut.Lock()
select { c.wmut.Lock()
case <-c.closed: defer c.imut.Unlock()
c.Unlock() defer c.wmut.Unlock()
if c.closed {
return return
default:
} }
close(c.closed)
c.closed = true
for _, ch := range c.awaiting { for _, ch := range c.awaiting {
close(ch) close(ch)
} }
c.awaiting = nil c.awaiting = nil
c.writer.Close() c.writer.Close()
c.reader.Close() c.reader.Close()
c.Unlock()
c.receiver.Close(c.id, err) c.receiver.Close(c.id, err)
} }
func (c *rawConnection) isClosed() bool { func (c *rawConnection) isClosed() bool {
select { c.wmut.Lock()
case <-c.closed: defer c.wmut.Unlock()
return true return c.closed
default:
return false
}
} }
func (c *rawConnection) readerLoop() { func (c *rawConnection) readerLoop() {
@ -299,8 +309,8 @@ loop:
for !c.isClosed() { for !c.isClosed() {
var hdr header var hdr header
hdr.decodeXDR(c.xr) hdr.decodeXDR(c.xr)
if c.xr.Error() != nil { if err := c.xr.Error(); err != nil {
c.close(c.xr.Error()) c.close(err)
break loop break loop
} }
if hdr.version != 0 { if hdr.version != 0 {
@ -312,8 +322,8 @@ loop:
case messageTypeIndex: case messageTypeIndex:
var im IndexMessage var im IndexMessage
im.decodeXDR(c.xr) im.decodeXDR(c.xr)
if c.xr.Error() != nil { if err := c.xr.Error(); err != nil {
c.close(c.xr.Error()) c.close(err)
break loop break loop
} else { } else {
@ -326,15 +336,12 @@ loop:
go c.receiver.Index(c.id, im.Repository, im.Files) go c.receiver.Index(c.id, im.Repository, im.Files)
} }
c.Lock()
c.hasRecvdIndex = true
c.Unlock()
case messageTypeIndexUpdate: case messageTypeIndexUpdate:
var im IndexMessage var im IndexMessage
im.decodeXDR(c.xr) im.decodeXDR(c.xr)
if c.xr.Error() != nil { if err := c.xr.Error(); err != nil {
c.close(c.xr.Error()) c.close(err)
break loop break loop
} else { } else {
go c.receiver.IndexUpdate(c.id, im.Repository, im.Files) go c.receiver.IndexUpdate(c.id, im.Repository, im.Files)
@ -343,8 +350,8 @@ loop:
case messageTypeRequest: case messageTypeRequest:
var req RequestMessage var req RequestMessage
req.decodeXDR(c.xr) req.decodeXDR(c.xr)
if c.xr.Error() != nil { if err := c.xr.Error(); err != nil {
c.close(c.xr.Error()) c.close(err)
break loop break loop
} }
go c.processRequest(hdr.msgID, req) go c.processRequest(hdr.msgID, req)
@ -352,16 +359,16 @@ loop:
case messageTypeResponse: case messageTypeResponse:
data := c.xr.ReadBytesMax(256 * 1024) // Sufficiently larger than max expected block size data := c.xr.ReadBytesMax(256 * 1024) // Sufficiently larger than max expected block size
if c.xr.Error() != nil { if err := c.xr.Error(); err != nil {
c.close(c.xr.Error()) c.close(err)
break loop break loop
} }
go func(hdr header, err error) { go func(hdr header, err error) {
c.Lock() c.imut.Lock()
rc, ok := c.awaiting[hdr.msgID] rc, ok := c.awaiting[hdr.msgID]
delete(c.awaiting, hdr.msgID) delete(c.awaiting, hdr.msgID)
c.Unlock() c.imut.Unlock()
if ok { if ok {
rc <- asyncResult{data, err} rc <- asyncResult{data, err}
@ -370,37 +377,34 @@ loop:
}(hdr, c.xr.Error()) }(hdr, c.xr.Error())
case messageTypePing: case messageTypePing:
c.Lock() c.wmut.Lock()
header{0, hdr.msgID, messageTypePong}.encodeXDR(c.xw) header{0, hdr.msgID, messageTypePong}.encodeXDR(c.xw)
err := c.flush() err := c.flush()
c.Unlock() c.wmut.Unlock()
if err != nil { if err != nil {
c.close(err) c.close(err)
break loop break loop
} else if c.xw.Error() != nil {
c.close(c.xw.Error())
break loop
} }
case messageTypePong: case messageTypePong:
c.RLock() c.imut.Lock()
rc, ok := c.awaiting[hdr.msgID] rc, ok := c.awaiting[hdr.msgID]
c.RUnlock()
if ok { if ok {
rc <- asyncResult{} go func() {
close(rc) rc <- asyncResult{}
close(rc)
}()
c.Lock()
delete(c.awaiting, hdr.msgID) delete(c.awaiting, hdr.msgID)
c.Unlock()
} }
c.imut.Unlock()
case messageTypeClusterConfig: case messageTypeClusterConfig:
var cm ClusterConfigMessage var cm ClusterConfigMessage
cm.decodeXDR(c.xr) cm.decodeXDR(c.xr)
if c.xr.Error() != nil { if err := c.xr.Error(); err != nil {
c.close(c.xr.Error()) c.close(err)
break loop break loop
} else { } else {
go c.receiver.ClusterConfig(c.id, cm) go c.receiver.ClusterConfig(c.id, cm)
@ -416,15 +420,14 @@ loop:
func (c *rawConnection) processRequest(msgID int, req RequestMessage) { func (c *rawConnection) processRequest(msgID int, req RequestMessage) {
data, _ := c.receiver.Request(c.id, req.Repository, req.Name, int64(req.Offset), int(req.Size)) data, _ := c.receiver.Request(c.id, req.Repository, req.Name, int64(req.Offset), int(req.Size))
c.Lock() c.wmut.Lock()
header{0, msgID, messageTypeResponse}.encodeXDR(c.xw) header{0, msgID, messageTypeResponse}.encodeXDR(c.xw)
_, err := c.xw.WriteBytes(data) c.xw.WriteBytes(data)
if err == nil { err := c.flush()
err = c.flush() c.wmut.Unlock()
}
c.Unlock()
buffers.Put(data) buffers.Put(data)
if err != nil { if err != nil {
c.close(err) c.close(err)
} }
@ -434,27 +437,22 @@ func (c *rawConnection) pingerLoop() {
var rc = make(chan bool, 1) var rc = make(chan bool, 1)
ticker := time.Tick(pingIdleTime / 2) ticker := time.Tick(pingIdleTime / 2)
for { for {
if c.isClosed() {
return
}
select { select {
case <-ticker: case <-ticker:
c.RLock() go func() {
ready := c.hasRecvdIndex && c.hasSentIndex rc <- c.ping()
c.RUnlock() }()
select {
if ready { case ok := <-rc:
go func() { if !ok {
rc <- c.ping() c.close(fmt.Errorf("ping failure"))
}()
select {
case ok := <-rc:
if !ok {
c.close(fmt.Errorf("ping failure"))
}
case <-time.After(pingTimeout):
c.close(fmt.Errorf("ping timeout"))
} }
case <-time.After(pingTimeout):
c.close(fmt.Errorf("ping timeout"))
} }
case <-c.closed:
return
} }
} }
} }