server_help.go 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216
  1. package zk
  2. import (
  3. "fmt"
  4. "io"
  5. "io/ioutil"
  6. "math/rand"
  7. "os"
  8. "path/filepath"
  9. "strings"
  10. "time"
  11. )
  // init seeds the global math/rand source from the current wall-clock time in
  // nanoseconds, so the random base port picked by StartTestCluster varies
  // between runs.
  func init() {
  	seed := time.Now().UnixNano()
  	rand.Seed(seed)
  }
  15. type TestServer struct {
  16. Port int
  17. Path string
  18. Srv *Server
  19. }
  20. type TestCluster struct {
  21. Path string
  22. Servers []TestServer
  23. }
  24. func StartTestCluster(size int, stdout, stderr io.Writer) (*TestCluster, error) {
  25. tmpPath, err := ioutil.TempDir("", "gozk")
  26. if err != nil {
  27. return nil, err
  28. }
  29. success := false
  30. startPort := int(rand.Int31n(6000) + 10000)
  31. cluster := &TestCluster{Path: tmpPath}
  32. defer func() {
  33. if !success {
  34. cluster.Stop()
  35. }
  36. }()
  37. for serverN := 0; serverN < size; serverN++ {
  38. srvPath := filepath.Join(tmpPath, fmt.Sprintf("srv%d", serverN))
  39. if err := os.Mkdir(srvPath, 0700); err != nil {
  40. return nil, err
  41. }
  42. port := startPort + serverN*3
  43. cfg := ServerConfig{
  44. ClientPort: port,
  45. DataDir: srvPath,
  46. }
  47. for i := 0; i < size; i++ {
  48. cfg.Servers = append(cfg.Servers, ServerConfigServer{
  49. ID: i + 1,
  50. Host: "127.0.0.1",
  51. PeerPort: startPort + i*3 + 1,
  52. LeaderElectionPort: startPort + i*3 + 2,
  53. })
  54. }
  55. cfgPath := filepath.Join(srvPath, "zoo.cfg")
  56. fi, err := os.Create(cfgPath)
  57. if err != nil {
  58. return nil, err
  59. }
  60. err = cfg.Marshall(fi)
  61. fi.Close()
  62. if err != nil {
  63. return nil, err
  64. }
  65. fi, err = os.Create(filepath.Join(srvPath, "myid"))
  66. if err != nil {
  67. return nil, err
  68. }
  69. _, err = fmt.Fprintf(fi, "%d\n", serverN+1)
  70. fi.Close()
  71. if err != nil {
  72. return nil, err
  73. }
  74. srv := &Server{
  75. ConfigPath: cfgPath,
  76. Stdout: stdout,
  77. Stderr: stderr,
  78. }
  79. if err := srv.Start(); err != nil {
  80. return nil, err
  81. }
  82. cluster.Servers = append(cluster.Servers, TestServer{
  83. Path: srvPath,
  84. Port: cfg.ClientPort,
  85. Srv: srv,
  86. })
  87. }
  88. if err := cluster.waitForStart(10, time.Second); err != nil {
  89. return nil, err
  90. }
  91. success = true
  92. return cluster, nil
  93. }
  94. func (tc *TestCluster) Connect(idx int) (*Conn, error) {
  95. zk, _, err := Connect([]string{fmt.Sprintf("127.0.0.1:%d", tc.Servers[idx].Port)}, time.Second*15)
  96. return zk, err
  97. }
  98. func (tc *TestCluster) ConnectAll() (*Conn, <-chan Event, error) {
  99. return tc.ConnectAllTimeout(time.Second * 15)
  100. }
  101. func (tc *TestCluster) ConnectAllTimeout(sessionTimeout time.Duration) (*Conn, <-chan Event, error) {
  102. return tc.ConnectWithOptions(sessionTimeout)
  103. }
  104. func (tc *TestCluster) ConnectWithOptions(sessionTimeout time.Duration, options ...connOption) (*Conn, <-chan Event, error) {
  105. hosts := make([]string, len(tc.Servers))
  106. for i, srv := range tc.Servers {
  107. hosts[i] = fmt.Sprintf("127.0.0.1:%d", srv.Port)
  108. }
  109. zk, ch, err := Connect(hosts, sessionTimeout, options...)
  110. return zk, ch, err
  111. }
  112. func (tc *TestCluster) Stop() error {
  113. for _, srv := range tc.Servers {
  114. srv.Srv.Stop()
  115. }
  116. defer os.RemoveAll(tc.Path)
  117. return tc.waitForStop(5, time.Second)
  118. }
  119. // waitForStart blocks until the cluster is up
  120. func (tc *TestCluster) waitForStart(maxRetry int, interval time.Duration) error {
  121. // verify that the servers are up with SRVR
  122. serverAddrs := make([]string, len(tc.Servers))
  123. for i, s := range tc.Servers {
  124. serverAddrs[i] = fmt.Sprintf("127.0.0.1:%d", s.Port)
  125. }
  126. for i := 0; i < maxRetry; i++ {
  127. _, ok := FLWSrvr(serverAddrs, time.Second)
  128. if ok {
  129. return nil
  130. }
  131. time.Sleep(interval)
  132. }
  133. return fmt.Errorf("unable to verify health of servers")
  134. }
  135. // waitForStop blocks until the cluster is down
  136. func (tc *TestCluster) waitForStop(maxRetry int, interval time.Duration) error {
  137. // verify that the servers are up with RUOK
  138. serverAddrs := make([]string, len(tc.Servers))
  139. for i, s := range tc.Servers {
  140. serverAddrs[i] = fmt.Sprintf("127.0.0.1:%d", s.Port)
  141. }
  142. var success bool
  143. for i := 0; i < maxRetry && !success; i++ {
  144. success = true
  145. for _, ok := range FLWRuok(serverAddrs, time.Second) {
  146. if ok {
  147. success = false
  148. }
  149. }
  150. if !success {
  151. time.Sleep(interval)
  152. }
  153. }
  154. if !success {
  155. return fmt.Errorf("unable to verify servers are down")
  156. }
  157. return nil
  158. }
  159. func (tc *TestCluster) StartServer(server string) {
  160. for _, s := range tc.Servers {
  161. if strings.HasSuffix(server, fmt.Sprintf(":%d", s.Port)) {
  162. s.Srv.Start()
  163. return
  164. }
  165. }
  166. panic(fmt.Sprintf("Unknown server: %s", server))
  167. }
  168. func (tc *TestCluster) StopServer(server string) {
  169. for _, s := range tc.Servers {
  170. if strings.HasSuffix(server, fmt.Sprintf(":%d", s.Port)) {
  171. s.Srv.Stop()
  172. return
  173. }
  174. }
  175. panic(fmt.Sprintf("Unknown server: %s", server))
  176. }
  177. func (tc *TestCluster) StartAllServers() error {
  178. for _, s := range tc.Servers {
  179. if err := s.Srv.Start(); err != nil {
  180. return fmt.Errorf(
  181. "Failed to start server listening on port `%d` : %+v", s.Port, err)
  182. }
  183. }
  184. return nil
  185. }
  186. func (tc *TestCluster) StopAllServers() error {
  187. for _, s := range tc.Servers {
  188. if err := s.Srv.Stop(); err != nil {
  189. return fmt.Errorf(
  190. "Failed to stop server listening on port `%d` : %+v", s.Port, err)
  191. }
  192. }
  193. return nil
  194. }