Auto-reconnect for regular authRPC client. (#3506)

Implement a storage rpc specific rpc client,
which does not reconnect unnecessarily.

Instead reconnect is handled at a different
layer for storage alone.

Rest of the calls using AuthRPC automatically
reconnect, i.e upon an error equal to `rpc.ErrShutdown`
they dial again and call the requested method again.
This commit is contained in:
Harshavardhana 2016-12-29 19:42:02 -08:00 committed by GitHub
parent 41cf580bb1
commit dd68cdd802
5 changed files with 155 additions and 90 deletions

View File

@ -17,7 +17,6 @@
package cmd package cmd
import ( import (
"net/rpc"
"net/url" "net/url"
"path" "path"
"sync" "sync"
@ -58,22 +57,14 @@ func (lc localAdminClient) Restart() error {
func (rc remoteAdminClient) Stop() error { func (rc remoteAdminClient) Stop() error {
args := GenericArgs{} args := GenericArgs{}
reply := GenericReply{} reply := GenericReply{}
err := rc.Call("Service.Shutdown", &args, &reply) return rc.Call("Service.Shutdown", &args, &reply)
if err != nil && err == rpc.ErrShutdown {
rc.Close()
}
return err
} }
// Restart - Sends restart command to remote server via RPC. // Restart - Sends restart command to remote server via RPC.
func (rc remoteAdminClient) Restart() error { func (rc remoteAdminClient) Restart() error {
args := GenericArgs{} args := GenericArgs{}
reply := GenericReply{} reply := GenericReply{}
err := rc.Call("Service.Restart", &args, &reply) return rc.Call("Service.Restart", &args, &reply)
if err != nil && err == rpc.ErrShutdown {
rc.Close()
}
return err
} }
// adminPeer - represents an entity that implements Stop and Restart methods. // adminPeer - represents an entity that implements Stop and Restart methods.

View File

@ -76,7 +76,6 @@ type AuthRPCClient struct {
mu sync.Mutex mu sync.Mutex
config *authConfig config *authConfig
rpc *RPCClient // reconnect'able rpc client built on top of net/rpc Client rpc *RPCClient // reconnect'able rpc client built on top of net/rpc Client
isLoggedIn bool // Indicates if the auth client has been logged in and token is valid.
serverToken string // Disk rpc JWT based token. serverToken string // Disk rpc JWT based token.
serverVersion string // Server version exchanged by the RPC. serverVersion string // Server version exchanged by the RPC.
} }
@ -88,8 +87,6 @@ func newAuthClient(cfg *authConfig) *AuthRPCClient {
config: cfg, config: cfg,
// Initialize a new reconnectable rpc client. // Initialize a new reconnectable rpc client.
rpc: newRPCClient(cfg.address, cfg.path, cfg.secureConn), rpc: newRPCClient(cfg.address, cfg.path, cfg.secureConn),
// Allocated auth client not logged in yet.
isLoggedIn: false,
} }
} }
@ -97,7 +94,7 @@ func newAuthClient(cfg *authConfig) *AuthRPCClient {
func (authClient *AuthRPCClient) Close() error { func (authClient *AuthRPCClient) Close() error {
authClient.mu.Lock() authClient.mu.Lock()
// reset token on closing a connection // reset token on closing a connection
authClient.isLoggedIn = false authClient.serverToken = ""
authClient.mu.Unlock() authClient.mu.Unlock()
return authClient.rpc.Close() return authClient.rpc.Close()
} }
@ -109,7 +106,7 @@ func (authClient *AuthRPCClient) Login() (err error) {
defer authClient.mu.Unlock() defer authClient.mu.Unlock()
// Return if already logged in. // Return if already logged in.
if authClient.isLoggedIn { if authClient.serverToken != "" {
return nil return nil
} }
@ -135,7 +132,6 @@ func (authClient *AuthRPCClient) Login() (err error) {
// Set token, time stamp as received from a successful login call. // Set token, time stamp as received from a successful login call.
authClient.serverToken = reply.Token authClient.serverToken = reply.Token
authClient.serverVersion = reply.ServerVersion authClient.serverVersion = reply.ServerVersion
authClient.isLoggedIn = true
return nil return nil
} }
@ -146,21 +142,34 @@ func (authClient *AuthRPCClient) Call(serviceMethod string, args interface {
SetToken(token string) SetToken(token string)
SetTimestamp(tstamp time.Time) SetTimestamp(tstamp time.Time)
}, reply interface{}) (err error) { }, reply interface{}) (err error) {
// On successful login, attempt the call. loginAndCallFn := func() error {
// On successful login, proceed to attempt the requested service method.
if err = authClient.Login(); err == nil { if err = authClient.Login(); err == nil {
// Set token and timestamp before the rpc call. // Set token and timestamp before the rpc call.
args.SetToken(authClient.serverToken) args.SetToken(authClient.serverToken)
args.SetTimestamp(time.Now().UTC()) args.SetTimestamp(time.Now().UTC())
// Call the underlying rpc. // Finally make the network call using net/rpc client.
err = authClient.rpc.Call(serviceMethod, args, reply) err = authClient.rpc.Call(serviceMethod, args, reply)
// Invalidate token, and mark it for re-login on subsequent reconnect.
if err == rpc.ErrShutdown {
authClient.mu.Lock()
authClient.isLoggedIn = false
authClient.mu.Unlock()
} }
return err
}
doneCh := make(chan struct{})
defer close(doneCh)
for i := range newRetryTimer(time.Second, time.Second*30, MaxJitter, doneCh) {
// Invalidate token, and mark it for re-login and
// reconnect upon rpc shutdown.
if err = loginAndCallFn(); err == rpc.ErrShutdown {
// Close the underlying connection, and proceed to reconnect
// if we haven't reached the retry threshold.
authClient.Close()
// No need to return error until the retry count threshold has reached.
if i < globalMaxAuthRPCRetryThreshold {
continue
}
}
break
} }
return err return err
} }

View File

@ -16,10 +16,7 @@
package cmd package cmd
import ( import "encoding/json"
"encoding/json"
"net/rpc"
)
// BucketMetaState - Interface to update bucket metadata in-memory // BucketMetaState - Interface to update bucket metadata in-memory
// state. // state.
@ -112,62 +109,26 @@ type remoteBucketMetaState struct {
// change to remote peer via RPC call. // change to remote peer via RPC call.
func (rc *remoteBucketMetaState) UpdateBucketNotification(args *SetBucketNotificationPeerArgs) error { func (rc *remoteBucketMetaState) UpdateBucketNotification(args *SetBucketNotificationPeerArgs) error {
reply := GenericReply{} reply := GenericReply{}
err := rc.Call("S3.SetBucketNotificationPeer", args, &reply) return rc.Call("S3.SetBucketNotificationPeer", args, &reply)
// Check for network error and retry once.
if err != nil && err == rpc.ErrShutdown {
// Close the underlying connection to attempt once more.
rc.Close()
// Attempt again and proceed.
err = rc.Call("S3.SetBucketNotificationPeer", args, &reply)
}
return err
} }
// remoteBucketMetaState.UpdateBucketListener - sends bucket listener change to // remoteBucketMetaState.UpdateBucketListener - sends bucket listener change to
// remote peer via RPC call. // remote peer via RPC call.
func (rc *remoteBucketMetaState) UpdateBucketListener(args *SetBucketListenerPeerArgs) error { func (rc *remoteBucketMetaState) UpdateBucketListener(args *SetBucketListenerPeerArgs) error {
reply := GenericReply{} reply := GenericReply{}
err := rc.Call("S3.SetBucketListenerPeer", args, &reply) return rc.Call("S3.SetBucketListenerPeer", args, &reply)
// Check for network error and retry once.
if err != nil && err == rpc.ErrShutdown {
// Close the underlying connection to attempt once more.
rc.Close()
// Attempt again and proceed.
err = rc.Call("S3.SetBucketListenerPeer", args, &reply)
}
return err
} }
// remoteBucketMetaState.UpdateBucketPolicy - sends bucket policy change to remote // remoteBucketMetaState.UpdateBucketPolicy - sends bucket policy change to remote
// peer via RPC call. // peer via RPC call.
func (rc *remoteBucketMetaState) UpdateBucketPolicy(args *SetBucketPolicyPeerArgs) error { func (rc *remoteBucketMetaState) UpdateBucketPolicy(args *SetBucketPolicyPeerArgs) error {
reply := GenericReply{} reply := GenericReply{}
err := rc.Call("S3.SetBucketPolicyPeer", args, &reply) return rc.Call("S3.SetBucketPolicyPeer", args, &reply)
// Check for network error and retry once.
if err != nil && err == rpc.ErrShutdown {
// Close the underlying connection to attempt once more.
rc.Close()
// Attempt again and proceed.
err = rc.Call("S3.SetBucketPolicyPeer", args, &reply)
}
return err
} }
// remoteBucketMetaState.SendEvent - sends event for bucket listener to remote // remoteBucketMetaState.SendEvent - sends event for bucket listener to remote
// peer via RPC call. // peer via RPC call.
func (rc *remoteBucketMetaState) SendEvent(args *EventArgs) error { func (rc *remoteBucketMetaState) SendEvent(args *EventArgs) error {
reply := GenericReply{} reply := GenericReply{}
err := rc.Call("S3.Event", args, &reply) return rc.Call("S3.Event", args, &reply)
// Check for network error and retry once.
if err != nil && err == rpc.ErrShutdown {
// Close the underlying connection to attempt once more.
rc.Close()
// Attempt again and proceed.
err = rc.Call("S3.Event", args, &reply)
}
return err
} }

View File

@ -93,6 +93,10 @@ var (
// giving up on the remote disk entirely. // giving up on the remote disk entirely.
globalMaxStorageRetryThreshold = 3 globalMaxStorageRetryThreshold = 3
// Attempt to retry only this many number of times before
// giving up on the remote RPC entirely.
globalMaxAuthRPCRetryThreshold = 1
// Add new variable global values here. // Add new variable global values here.
) )

View File

@ -23,7 +23,9 @@ import (
"net/rpc" "net/rpc"
"net/url" "net/url"
"path" "path"
"sync"
"sync/atomic" "sync/atomic"
"time"
"github.com/minio/minio/pkg/disk" "github.com/minio/minio/pkg/disk"
) )
@ -32,7 +34,7 @@ type networkStorage struct {
networkIOErrCount int32 // ref: https://golang.org/pkg/sync/atomic/#pkg-note-BUG networkIOErrCount int32 // ref: https://golang.org/pkg/sync/atomic/#pkg-note-BUG
netAddr string netAddr string
netPath string netPath string
rpcClient *AuthRPCClient rpcClient *storageRPCClient
} }
const ( const (
@ -97,6 +99,104 @@ func toStorageErr(err error) error {
return err return err
} }
// storageRPCClient is a wrapper type for RPCClient which provides JWT based authentication across reconnects.
type storageRPCClient struct {
sync.Mutex
cfg storageConfig
rpc *RPCClient // reconnect'able rpc client built on top of net/rpc Client
serverToken string // Disk rpc JWT based token.
serverVersion string // Server version exchanged by the RPC.
}
// Storage config represents authentication credentials and Login
// method name to be used for fetching JWT tokens from the storage
// server.
type storageConfig struct {
addr string // Network address path of storage RPC server.
path string // Network storage path for HTTP dial.
secureConn bool // Indicates if this storage RPC is on a secured connection.
creds credential
}
// newStorageClient - returns a jwt based authenticated (go) storage rpc client.
func newStorageClient(storageCfg storageConfig) *storageRPCClient {
return &storageRPCClient{
// Save the config.
cfg: storageCfg,
rpc: newRPCClient(storageCfg.addr, storageCfg.path, storageCfg.secureConn),
}
}
// Close - closes underlying rpc connection.
func (storageClient *storageRPCClient) Close() error {
storageClient.Lock()
// reset token on closing a connection
storageClient.serverToken = ""
storageClient.Unlock()
return storageClient.rpc.Close()
}
// Login - a jwt based authentication is performed with rpc server.
func (storageClient *storageRPCClient) Login() (err error) {
storageClient.Lock()
// As soon as the function returns unlock,
defer storageClient.Unlock()
// Return if token is already set.
if storageClient.serverToken != "" {
return nil
}
reply := RPCLoginReply{}
if err = storageClient.rpc.Call("Storage.LoginHandler", RPCLoginArgs{
Username: storageClient.cfg.creds.AccessKey,
Password: storageClient.cfg.creds.SecretKey,
}, &reply); err != nil {
return err
}
// Validate if version do indeed match.
if reply.ServerVersion != Version {
return errServerVersionMismatch
}
// Validate if server timestamp is skewed.
curTime := time.Now().UTC()
if curTime.Sub(reply.Timestamp) > globalMaxSkewTime {
return errServerTimeMismatch
}
// Set token, time stamp as received from a successful login call.
storageClient.serverToken = reply.Token
storageClient.serverVersion = reply.ServerVersion
return nil
}
// Call - If rpc connection isn't established yet since previous disconnect,
// connection is established, a jwt authenticated login is performed and then
// the call is performed.
func (storageClient *storageRPCClient) Call(serviceMethod string, args interface {
SetToken(token string)
SetTimestamp(tstamp time.Time)
}, reply interface{}) (err error) {
// On successful login, attempt the call.
if err = storageClient.Login(); err != nil {
return err
}
// Set token and timestamp before the rpc call.
args.SetToken(storageClient.serverToken)
args.SetTimestamp(time.Now().UTC())
// Call the underlying rpc.
err = storageClient.rpc.Call(serviceMethod, args, reply)
// Invalidate token, and mark it for re-login.
if err == rpc.ErrShutdown {
storageClient.Close()
}
return err
}
// Initialize new storage rpc client. // Initialize new storage rpc client.
func newStorageRPC(ep *url.URL) (StorageAPI, error) { func newStorageRPC(ep *url.URL) (StorageAPI, error) {
if ep == nil { if ep == nil {
@ -108,28 +208,28 @@ func newStorageRPC(ep *url.URL) (StorageAPI, error) {
rpcAddr := ep.Host rpcAddr := ep.Host
// Initialize rpc client with network address and rpc path. // Initialize rpc client with network address and rpc path.
accessKeyID := serverConfig.GetCredential().AccessKey accessKey := serverConfig.GetCredential().AccessKey
secretAccessKey := serverConfig.GetCredential().SecretKey secretKey := serverConfig.GetCredential().SecretKey
if ep.User != nil { if ep.User != nil {
accessKeyID = ep.User.Username() accessKey = ep.User.Username()
if key, set := ep.User.Password(); set { if key, set := ep.User.Password(); set {
secretAccessKey = key secretKey = key
} }
} }
rpcClient := newAuthClient(&authConfig{
accessKey: accessKeyID,
secretKey: secretAccessKey,
secureConn: isSSL(),
address: rpcAddr,
path: rpcPath,
loginMethod: "Storage.LoginHandler",
})
// Initialize network storage. // Initialize network storage.
ndisk := &networkStorage{ ndisk := &networkStorage{
netAddr: ep.Host, netAddr: ep.Host,
netPath: getPath(ep), netPath: getPath(ep),
rpcClient: rpcClient, rpcClient: newStorageClient(storageConfig{
addr: rpcAddr,
path: rpcPath,
creds: credential{
AccessKey: accessKey,
SecretKey: secretKey,
},
secureConn: isSSL(),
}),
} }
// Returns successfully here. // Returns successfully here.