maintenance.go 7.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243
  1. // Copyright 2016 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package clientv3
  15. import (
  16. "context"
  17. "fmt"
  18. "io"
  19. pb "go.etcd.io/etcd/etcdserver/etcdserverpb"
  20. "go.uber.org/zap"
  21. "google.golang.org/grpc"
  22. )
  23. type (
  24. DefragmentResponse pb.DefragmentResponse
  25. AlarmResponse pb.AlarmResponse
  26. AlarmMember pb.AlarmMember
  27. StatusResponse pb.StatusResponse
  28. HashKVResponse pb.HashKVResponse
  29. MoveLeaderResponse pb.MoveLeaderResponse
  30. )
  31. type Maintenance interface {
  32. // AlarmList gets all active alarms.
  33. AlarmList(ctx context.Context) (*AlarmResponse, error)
  34. // AlarmDisarm disarms a given alarm.
  35. AlarmDisarm(ctx context.Context, m *AlarmMember) (*AlarmResponse, error)
  36. // Defragment releases wasted space from internal fragmentation on a given etcd member.
  37. // Defragment is only needed when deleting a large number of keys and want to reclaim
  38. // the resources.
  39. // Defragment is an expensive operation. User should avoid defragmenting multiple members
  40. // at the same time.
  41. // To defragment multiple members in the cluster, user need to call defragment multiple
  42. // times with different endpoints.
  43. Defragment(ctx context.Context, endpoint string) (*DefragmentResponse, error)
  44. // Status gets the status of the endpoint.
  45. Status(ctx context.Context, endpoint string) (*StatusResponse, error)
  46. // HashKV returns a hash of the KV state at the time of the RPC.
  47. // If revision is zero, the hash is computed on all keys. If the revision
  48. // is non-zero, the hash is computed on all keys at or below the given revision.
  49. HashKV(ctx context.Context, endpoint string, rev int64) (*HashKVResponse, error)
  50. // Snapshot provides a reader for a point-in-time snapshot of etcd.
  51. // If the context "ctx" is canceled or timed out, reading from returned
  52. // "io.ReadCloser" would error out (e.g. context.Canceled, context.DeadlineExceeded).
  53. Snapshot(ctx context.Context) (io.ReadCloser, error)
  54. // MoveLeader requests current leader to transfer its leadership to the transferee.
  55. // Request must be made to the leader.
  56. MoveLeader(ctx context.Context, transfereeID uint64) (*MoveLeaderResponse, error)
  57. }
  58. type maintenance struct {
  59. lg *zap.Logger
  60. dial func(endpoint string) (pb.MaintenanceClient, func(), error)
  61. remote pb.MaintenanceClient
  62. callOpts []grpc.CallOption
  63. }
  64. func NewMaintenance(c *Client) Maintenance {
  65. api := &maintenance{
  66. lg: c.lg,
  67. dial: func(endpoint string) (pb.MaintenanceClient, func(), error) {
  68. conn, err := c.Dial(endpoint)
  69. if err != nil {
  70. return nil, nil, fmt.Errorf("failed to dial endpoint %s with maintenance client: %v", endpoint, err)
  71. }
  72. cancel := func() { conn.Close() }
  73. return RetryMaintenanceClient(c, conn), cancel, nil
  74. },
  75. remote: RetryMaintenanceClient(c, c.conn),
  76. }
  77. if c != nil {
  78. api.callOpts = c.callOpts
  79. }
  80. return api
  81. }
  82. func NewMaintenanceFromMaintenanceClient(remote pb.MaintenanceClient, c *Client) Maintenance {
  83. api := &maintenance{
  84. lg: c.lg,
  85. dial: func(string) (pb.MaintenanceClient, func(), error) {
  86. return remote, func() {}, nil
  87. },
  88. remote: remote,
  89. }
  90. if c != nil {
  91. api.callOpts = c.callOpts
  92. }
  93. return api
  94. }
  95. func (m *maintenance) AlarmList(ctx context.Context) (*AlarmResponse, error) {
  96. req := &pb.AlarmRequest{
  97. Action: pb.AlarmRequest_GET,
  98. MemberID: 0, // all
  99. Alarm: pb.AlarmType_NONE, // all
  100. }
  101. resp, err := m.remote.Alarm(ctx, req, m.callOpts...)
  102. if err == nil {
  103. return (*AlarmResponse)(resp), nil
  104. }
  105. return nil, toErr(ctx, err)
  106. }
  107. func (m *maintenance) AlarmDisarm(ctx context.Context, am *AlarmMember) (*AlarmResponse, error) {
  108. req := &pb.AlarmRequest{
  109. Action: pb.AlarmRequest_DEACTIVATE,
  110. MemberID: am.MemberID,
  111. Alarm: am.Alarm,
  112. }
  113. if req.MemberID == 0 && req.Alarm == pb.AlarmType_NONE {
  114. ar, err := m.AlarmList(ctx)
  115. if err != nil {
  116. return nil, toErr(ctx, err)
  117. }
  118. ret := AlarmResponse{}
  119. for _, am := range ar.Alarms {
  120. dresp, derr := m.AlarmDisarm(ctx, (*AlarmMember)(am))
  121. if derr != nil {
  122. return nil, toErr(ctx, derr)
  123. }
  124. ret.Alarms = append(ret.Alarms, dresp.Alarms...)
  125. }
  126. return &ret, nil
  127. }
  128. resp, err := m.remote.Alarm(ctx, req, m.callOpts...)
  129. if err == nil {
  130. return (*AlarmResponse)(resp), nil
  131. }
  132. return nil, toErr(ctx, err)
  133. }
  134. func (m *maintenance) Defragment(ctx context.Context, endpoint string) (*DefragmentResponse, error) {
  135. remote, cancel, err := m.dial(endpoint)
  136. if err != nil {
  137. return nil, toErr(ctx, err)
  138. }
  139. defer cancel()
  140. resp, err := remote.Defragment(ctx, &pb.DefragmentRequest{}, m.callOpts...)
  141. if err != nil {
  142. return nil, toErr(ctx, err)
  143. }
  144. return (*DefragmentResponse)(resp), nil
  145. }
  146. func (m *maintenance) Status(ctx context.Context, endpoint string) (*StatusResponse, error) {
  147. remote, cancel, err := m.dial(endpoint)
  148. if err != nil {
  149. return nil, toErr(ctx, err)
  150. }
  151. defer cancel()
  152. resp, err := remote.Status(ctx, &pb.StatusRequest{}, m.callOpts...)
  153. if err != nil {
  154. return nil, toErr(ctx, err)
  155. }
  156. return (*StatusResponse)(resp), nil
  157. }
  158. func (m *maintenance) HashKV(ctx context.Context, endpoint string, rev int64) (*HashKVResponse, error) {
  159. remote, cancel, err := m.dial(endpoint)
  160. if err != nil {
  161. return nil, toErr(ctx, err)
  162. }
  163. defer cancel()
  164. resp, err := remote.HashKV(ctx, &pb.HashKVRequest{Revision: rev}, m.callOpts...)
  165. if err != nil {
  166. return nil, toErr(ctx, err)
  167. }
  168. return (*HashKVResponse)(resp), nil
  169. }
  170. func (m *maintenance) Snapshot(ctx context.Context) (io.ReadCloser, error) {
  171. ss, err := m.remote.Snapshot(ctx, &pb.SnapshotRequest{}, append(m.callOpts, withMax(defaultStreamMaxRetries))...)
  172. if err != nil {
  173. return nil, toErr(ctx, err)
  174. }
  175. m.lg.Info("opened snapshot stream; downloading")
  176. pr, pw := io.Pipe()
  177. go func() {
  178. for {
  179. resp, err := ss.Recv()
  180. if err != nil {
  181. switch err {
  182. case io.EOF:
  183. m.lg.Info("completed snapshot read; closing")
  184. default:
  185. m.lg.Warn("failed to receive from snapshot stream; closing", zap.Error(err))
  186. }
  187. pw.CloseWithError(err)
  188. return
  189. }
  190. // can "resp == nil && err == nil"
  191. // before we receive snapshot SHA digest?
  192. // No, server sends EOF with an empty response
  193. // after it sends SHA digest at the end
  194. if _, werr := pw.Write(resp.Blob); werr != nil {
  195. pw.CloseWithError(werr)
  196. return
  197. }
  198. }
  199. }()
  200. return &snapshotReadCloser{ctx: ctx, ReadCloser: pr}, nil
  201. }
  202. type snapshotReadCloser struct {
  203. ctx context.Context
  204. io.ReadCloser
  205. }
  206. func (rc *snapshotReadCloser) Read(p []byte) (n int, err error) {
  207. n, err = rc.ReadCloser.Read(p)
  208. return n, toErr(rc.ctx, err)
  209. }
  210. func (m *maintenance) MoveLeader(ctx context.Context, transfereeID uint64) (*MoveLeaderResponse, error) {
  211. resp, err := m.remote.MoveLeader(ctx, &pb.MoveLeaderRequest{TargetID: transfereeID}, m.callOpts...)
  212. return (*MoveLeaderResponse)(resp), toErr(ctx, err)
  213. }