Work on timer teardown + bug fixes

Added waitgroups to peer struct for routine
start / stop synchronisation
This commit is contained in:
Mathias Hall-Andersen 2018-01-13 09:00:37 +01:00
parent d73f960aab
commit 1dd590b91b
8 changed files with 102 additions and 47 deletions

View file

@ -64,13 +64,9 @@ func unsafeCloseBind(device *Device) error {
return err return err
} }
func updateBind(device *Device) error { /* Must hold device and net lock
device.mutex.Lock() */
defer device.mutex.Unlock() func unsafeUpdateBind(device *Device) error {
netc := &device.net
netc.mutex.Lock()
defer netc.mutex.Unlock()
// close existing sockets // close existing sockets
@ -89,6 +85,7 @@ func updateBind(device *Device) error {
// bind to new port // bind to new port
var err error var err error
netc := &device.net
netc.bind, netc.port, err = CreateBind(netc.port) netc.bind, netc.port, err = CreateBind(netc.port)
if err != nil { if err != nil {
netc.bind = nil netc.bind = nil

View file

@ -1,6 +1,7 @@
package main package main
import ( import (
"github.com/sasha-s/go-deadlock"
"runtime" "runtime"
"sync" "sync"
"sync/atomic" "sync/atomic"
@ -21,12 +22,12 @@ type Device struct {
messageBuffers sync.Pool messageBuffers sync.Pool
} }
net struct { net struct {
mutex sync.RWMutex mutex deadlock.RWMutex
bind Bind // bind interface bind Bind // bind interface
port uint16 // listening port port uint16 // listening port
fwmark uint32 // mark value (0 = disabled) fwmark uint32 // mark value (0 = disabled)
} }
mutex sync.RWMutex mutex deadlock.RWMutex
privateKey NoisePrivateKey privateKey NoisePrivateKey
publicKey NoisePublicKey publicKey NoisePublicKey
routingTable RoutingTable routingTable RoutingTable
@ -49,8 +50,15 @@ func (device *Device) Up() {
device.mutex.Lock() device.mutex.Lock()
defer device.mutex.Unlock() defer device.mutex.Unlock()
device.isUp.Set(true) device.net.mutex.Lock()
updateBind(device) defer device.net.mutex.Unlock()
if device.isUp.Swap(true) {
return
}
unsafeUpdateBind(device)
for _, peer := range device.peers { for _, peer := range device.peers {
peer.Start() peer.Start()
} }
@ -60,8 +68,12 @@ func (device *Device) Down() {
device.mutex.Lock() device.mutex.Lock()
defer device.mutex.Unlock() defer device.mutex.Unlock()
device.isUp.Set(false) if !device.isUp.Swap(false) {
return
}
closeBind(device) closeBind(device)
for _, peer := range device.peers { for _, peer := range device.peers {
peer.Stop() peer.Stop()
} }
@ -75,7 +87,6 @@ func removePeerUnsafe(device *Device, key NoisePublicKey) {
if !ok { if !ok {
return return
} }
peer.mutex.Lock()
peer.Stop() peer.Stop()
device.routingTable.RemovePeer(peer) device.routingTable.RemovePeer(peer)
delete(device.peers, key) delete(device.peers, key)

View file

@ -8,6 +8,10 @@ import (
"time" "time"
) )
const (
PeerRoutineNumber = 4
)
type Peer struct { type Peer struct {
id uint id uint
mutex sync.RWMutex mutex sync.RWMutex
@ -34,7 +38,6 @@ type Peer struct {
flushNonceQueue Signal // size 1, empty queued packets flushNonceQueue Signal // size 1, empty queued packets
messageSend Signal // size 1, message was sent to peer messageSend Signal // size 1, message was sent to peer
messageReceived Signal // size 1, authenticated message recv messageReceived Signal // size 1, authenticated message recv
stop Signal // size 0, stop all goroutines in peer
} }
timer struct { timer struct {
// state related to WireGuard timers // state related to WireGuard timers
@ -54,6 +57,12 @@ type Peer struct {
outbound chan *QueueOutboundElement // sequential ordering of work outbound chan *QueueOutboundElement // sequential ordering of work
inbound chan *QueueInboundElement // sequential ordering of work inbound chan *QueueInboundElement // sequential ordering of work
} }
routines struct {
mutex sync.Mutex // held when stopping / starting routines
starting sync.WaitGroup // routines pending start
stopping sync.WaitGroup // routines pending stop
stop Signal // size 0, stop all goroutines in peer
}
mac CookieGenerator mac CookieGenerator
} }
@ -121,6 +130,10 @@ func (device *Device) NewPeer(pk NoisePublicKey) (*Peer, error) {
peer.signal.handshakeCompleted = NewSignal() peer.signal.handshakeCompleted = NewSignal()
peer.signal.flushNonceQueue = NewSignal() peer.signal.flushNonceQueue = NewSignal()
peer.routines.mutex.Lock()
peer.routines.stop = NewSignal()
peer.routines.mutex.Unlock()
return peer, nil return peer, nil
} }
@ -156,32 +169,43 @@ func (peer *Peer) String() string {
) )
} }
/* Starts all routines for a given peer func (peer *Peer) Start() {
*
* Requires that the caller holds the exclusive peer lock!
*/
func unsafePeerStart(peer *Peer) {
peer.signal.stop.Broadcast()
peer.signal.stop = NewSignal()
var wait sync.WaitGroup peer.routines.mutex.Lock()
defer peer.routines.mutex.Lock()
wait.Add(1) // stop & wait for ongoing routines (if any)
peer.routines.stop.Broadcast()
peer.routines.starting.Wait()
peer.routines.stopping.Wait()
// reset signal and start (new) routines
peer.routines.stop = NewSignal()
peer.routines.starting.Add(PeerRoutineNumber)
peer.routines.stopping.Add(PeerRoutineNumber)
go peer.RoutineNonce() go peer.RoutineNonce()
go peer.RoutineTimerHandler(&wait) go peer.RoutineTimerHandler()
go peer.RoutineSequentialSender() go peer.RoutineSequentialSender()
go peer.RoutineSequentialReceiver() go peer.RoutineSequentialReceiver()
wait.Wait() peer.routines.starting.Wait()
}
func (peer *Peer) Start() {
peer.mutex.Lock()
unsafePeerStart(peer)
peer.mutex.Unlock()
} }
func (peer *Peer) Stop() { func (peer *Peer) Stop() {
peer.signal.stop.Broadcast()
peer.routines.mutex.Lock()
defer peer.routines.mutex.Lock()
// stop & wait for ongoing routines (if any)
peer.routines.stop.Broadcast()
peer.routines.starting.Wait()
peer.routines.stopping.Wait()
// reset signal (to handle repeated stopping)
peer.routines.stop = NewSignal()
} }

View file

@ -497,7 +497,7 @@ func (peer *Peer) RoutineSequentialReceiver() {
select { select {
case <-peer.signal.stop.Wait(): case <-peer.routines.stop.Wait():
logDebug.Println("Routine, sequential receiver, stopped for peer", peer.id) logDebug.Println("Routine, sequential receiver, stopped for peer", peer.id)
return return

View file

@ -192,7 +192,7 @@ func (peer *Peer) RoutineNonce() {
for { for {
NextPacket: NextPacket:
select { select {
case <-peer.signal.stop.Wait(): case <-peer.routines.stop.Wait():
return return
case elem := <-peer.queue.nonce: case elem := <-peer.queue.nonce:
@ -217,7 +217,7 @@ func (peer *Peer) RoutineNonce() {
logDebug.Println("Clearing queue for", peer.String()) logDebug.Println("Clearing queue for", peer.String())
peer.FlushNonceQueue() peer.FlushNonceQueue()
goto NextPacket goto NextPacket
case <-peer.signal.stop.Wait(): case <-peer.routines.stop.Wait():
return return
} }
} }
@ -309,15 +309,20 @@ func (device *Device) RoutineEncryption() {
* The routine terminates when the outbound queue is closed. * The routine terminates when the outbound queue is closed.
*/ */
func (peer *Peer) RoutineSequentialSender() { func (peer *Peer) RoutineSequentialSender() {
defer peer.routines.stopping.Done()
device := peer.device device := peer.device
logDebug := device.log.Debug logDebug := device.log.Debug
logDebug.Println("Routine, sequential sender, started for", peer.String()) logDebug.Println("Routine, sequential sender, started for", peer.String())
peer.routines.starting.Done()
for { for {
select { select {
case <-peer.signal.stop.Wait(): case <-peer.routines.stop.Wait():
logDebug.Println( logDebug.Println(
"Routine, sequential sender, stopped for", peer.String()) "Routine, sequential sender, stopped for", peer.String())
return return

View file

@ -4,7 +4,6 @@ import (
"bytes" "bytes"
"encoding/binary" "encoding/binary"
"math/rand" "math/rand"
"sync"
"sync/atomic" "sync/atomic"
"time" "time"
) )
@ -182,7 +181,10 @@ func (peer *Peer) sendNewHandshake() error {
return err return err
} }
func (peer *Peer) RoutineTimerHandler(ready *sync.WaitGroup) { func (peer *Peer) RoutineTimerHandler() {
defer peer.routines.stopping.Done()
device := peer.device device := peer.device
logInfo := device.log.Info logInfo := device.log.Info
@ -203,15 +205,20 @@ func (peer *Peer) RoutineTimerHandler(ready *sync.WaitGroup) {
peer.timer.keepalivePersistent.Reset(duration) peer.timer.keepalivePersistent.Reset(duration)
} }
// signal that timers are reset // signal synchronised setup complete
ready.Done() peer.routines.starting.Done()
// handle timer events // handle timer events
for { for {
select { select {
/* stopping */
case <-peer.routines.stop.Wait():
return
/* timers */ /* timers */
// keep-alive // keep-alive
@ -312,9 +319,6 @@ func (peer *Peer) RoutineTimerHandler(ready *sync.WaitGroup) {
/* signals */ /* signals */
case <-peer.signal.stop.Wait():
return
case <-peer.signal.handshakeBegin.Wait(): case <-peer.signal.handshakeBegin.Wait():
peer.signal.handshakeBegin.Disable() peer.signal.handshakeBegin.Disable()

View file

@ -45,14 +45,14 @@ func (device *Device) RoutineTUNEventReader() {
} }
} }
if event&TUNEventUp != 0 { if event&TUNEventUp != 0 && !device.isUp.Get() {
logInfo.Println("Interface set up") logInfo.Println("Interface set up")
device.Up() device.Up()
} }
if event&TUNEventDown != 0 { if event&TUNEventDown != 0 && device.isUp.Get() {
logInfo.Println("Interface set down") logInfo.Println("Interface set down")
device.Up() device.Down()
} }
} }
} }

View file

@ -133,13 +133,27 @@ func ipcSetOperation(device *Device, socket *bufio.ReadWriter) *IPCError {
device.SetPrivateKey(sk) device.SetPrivateKey(sk)
case "listen_port": case "listen_port":
// parse port number
port, err := strconv.ParseUint(value, 10, 16) port, err := strconv.ParseUint(value, 10, 16)
if err != nil { if err != nil {
logError.Println("Failed to parse listen_port:", err) logError.Println("Failed to parse listen_port:", err)
return &IPCError{Code: ipcErrorInvalid} return &IPCError{Code: ipcErrorInvalid}
} }
// update port and rebind
device.mutex.Lock()
device.net.mutex.Lock()
device.net.port = uint16(port) device.net.port = uint16(port)
if err := updateBind(device); err != nil { err = unsafeUpdateBind(device)
device.net.mutex.Unlock()
device.mutex.Unlock()
if err != nil {
logError.Println("Failed to set listen_port:", err) logError.Println("Failed to set listen_port:", err)
return &IPCError{Code: ipcErrorPortInUse} return &IPCError{Code: ipcErrorPortInUse}
} }