aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorChris Lu <chrislusf@users.noreply.github.com>2020-09-21 19:49:15 -0700
committerGitHub <noreply@github.com>2020-09-21 19:49:15 -0700
commitec5b9f1e91a8609d0e70bf9d26dc0840774153c4 (patch)
tree48ede45893c2130d3e039f7fe4af8440835eb02d
parent9cdbfc1a4987bdb46f16ae37624ed69ef66778a9 (diff)
parent658fc2e5b619c453ddecc805bc363a25f75ff22d (diff)
downloadseaweedfs-ec5b9f1e91a8609d0e70bf9d26dc0840774153c4.tar.xz
seaweedfs-ec5b9f1e91a8609d0e70bf9d26dc0840774153c4.zip
Merge pull request #1475 from levenlabs/lock
Fix deadlock with KeepConnected and SendHeartbeat
-rw-r--r--weed/command/server.go2
-rw-r--r--weed/server/master_grpc_server.go10
2 files changed, 9 insertions, 3 deletions
diff --git a/weed/command/server.go b/weed/command/server.go
index 6f40263bb..aee62290a 100644
--- a/weed/command/server.go
+++ b/weed/command/server.go
@@ -99,7 +99,7 @@ func init() {
serverOptions.v.fileSizeLimitMB = cmdServer.Flag.Int("volume.fileSizeLimitMB", 1024, "limit file size to avoid out of memory")
serverOptions.v.publicUrl = cmdServer.Flag.String("volume.publicUrl", "", "publicly accessible address")
serverOptions.v.preStopSeconds = cmdServer.Flag.Int("volume.preStopSeconds", 10, "number of seconds between stop send heartbeats and stop volume server")
- serverOptions.v.pprof = &False
+ serverOptions.v.pprof = cmdServer.Flag.Bool("volume.pprof", false, "enable pprof http handlers. precludes --memprofile and --cpuprofile")
s3Options.port = cmdServer.Flag.Int("s3.port", 8333, "s3 server http listen port")
s3Options.domainName = cmdServer.Flag.String("s3.domainName", "", "suffix of the host name, {bucket}.{domainName}")
diff --git a/weed/server/master_grpc_server.go b/weed/server/master_grpc_server.go
index f3a2ee013..692909a29 100644
--- a/weed/server/master_grpc_server.go
+++ b/weed/server/master_grpc_server.go
@@ -187,7 +187,8 @@ func (ms *MasterServer) KeepConnected(stream master_pb.Seaweed_KeepConnectedServ
peerAddress := findClientAddress(stream.Context(), req.GrpcPort)
- stopChan := make(chan bool)
+ // buffer by 1 so we don't end up getting stuck writing to stopChan forever
+ stopChan := make(chan bool, 1)
clientName, messageChan := ms.addClient(req.Name, peerAddress)
@@ -247,7 +248,12 @@ func (ms *MasterServer) addClient(clientType string, clientAddress string) (clie
clientName = clientType + "@" + clientAddress
glog.V(0).Infof("+ client %v", clientName)
- messageChan = make(chan *master_pb.VolumeLocation)
+ // we buffer this because otherwise we end up in a potential deadlock where
+ // the KeepConnected loop is no longer listening on this channel but we're
+ // trying to send to it in SendHeartbeat and so we can't lock the
+ // clientChansLock to remove the channel and we're stuck writing to it
+ // 100 is probably overkill
+ messageChan = make(chan *master_pb.VolumeLocation, 100)
ms.clientChansLock.Lock()
ms.clientChans[clientName] = messageChan