clutser_test.go 4.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219
  1. package cluster
  2. import (
  3. "testing"
  4. "time"
  5. "github.com/langgenius/dify-plugin-daemon/internal/types/app"
  6. "github.com/langgenius/dify-plugin-daemon/internal/utils/cache"
  7. "github.com/langgenius/dify-plugin-daemon/internal/utils/log"
  8. "github.com/langgenius/dify-plugin-daemon/internal/utils/routine"
  9. )
  10. func createSimulationCluster(nums int) ([]*Cluster, error) {
  11. err := cache.InitRedisClient("0.0.0.0:6379", "difyai123456")
  12. if err != nil {
  13. return nil, err
  14. }
  15. result := make([]*Cluster, 0)
  16. for i := 0; i < nums; i++ {
  17. result = append(result, NewCluster(&app.Config{
  18. ServerPort: 12121,
  19. }, nil))
  20. }
  21. log.SetShowLog(false)
  22. routine.InitPool(1024)
  23. // delete master key
  24. if err := cache.Del(PREEMPTION_LOCK_KEY); err != nil {
  25. return nil, err
  26. }
  27. return result, nil
  28. }
  29. func launchSimulationCluster(clusters []*Cluster) {
  30. for _, cluster := range clusters {
  31. cluster.Launch()
  32. }
  33. }
  34. func closeSimulationCluster(clusters []*Cluster, t *testing.T) {
  35. for _, cluster := range clusters {
  36. cluster.Close()
  37. // wait for the cluster to close
  38. <-cluster.NotifyClusterStopped()
  39. // check if the cluster is closed
  40. _, err := cache.GetMapField[node](CLUSTER_STATUS_HASH_MAP_KEY, cluster.id)
  41. if err == nil {
  42. t.Errorf("cluster is not closed")
  43. return
  44. }
  45. }
  46. }
  47. func TestSingleClusterLifetime(t *testing.T) {
  48. clusters, err := createSimulationCluster(1)
  49. if err != nil {
  50. t.Errorf("create simulation cluster failed: %v", err)
  51. return
  52. }
  53. launchSimulationCluster(clusters)
  54. defer closeSimulationCluster(clusters, t)
  55. <-clusters[0].NotifyBecomeMaster()
  56. _, err = cache.GetMapField[node](CLUSTER_STATUS_HASH_MAP_KEY, clusters[0].id)
  57. if err != nil {
  58. t.Errorf("get cluster status failed: %v", err)
  59. return
  60. }
  61. }
  62. func TestMultipleClusterLifetime(t *testing.T) {
  63. clusters, err := createSimulationCluster(3)
  64. if err != nil {
  65. t.Errorf("create simulation cluster failed: %v", err)
  66. return
  67. }
  68. launchSimulationCluster(clusters)
  69. defer closeSimulationCluster(clusters, t)
  70. select {
  71. case <-clusters[0].NotifyBecomeMaster():
  72. case <-clusters[1].NotifyBecomeMaster():
  73. case <-clusters[2].NotifyBecomeMaster():
  74. }
  75. hasMaster := false
  76. for _, cluster := range clusters {
  77. _, err := cache.GetMapField[node](CLUSTER_STATUS_HASH_MAP_KEY, cluster.id)
  78. if err != nil {
  79. t.Errorf("get cluster status failed: %v", err)
  80. return
  81. }
  82. if cluster.IsMaster() {
  83. if hasMaster {
  84. t.Errorf("multiple master")
  85. return
  86. } else {
  87. hasMaster = true
  88. }
  89. }
  90. }
  91. if !hasMaster {
  92. t.Errorf("no master")
  93. }
  94. }
  95. func TestClusterSubstituteMaster(t *testing.T) {
  96. clusters, err := createSimulationCluster(3)
  97. if err != nil {
  98. t.Errorf("create simulation cluster failed: %v", err)
  99. return
  100. }
  101. launchSimulationCluster(clusters)
  102. defer closeSimulationCluster(clusters, t)
  103. select {
  104. case <-clusters[0].NotifyBecomeMaster():
  105. case <-clusters[1].NotifyBecomeMaster():
  106. case <-clusters[2].NotifyBecomeMaster():
  107. }
  108. // close the master
  109. originalMasterId := ""
  110. for _, cluster := range clusters {
  111. if cluster.IsMaster() {
  112. cluster.Close()
  113. originalMasterId = cluster.id
  114. break
  115. }
  116. }
  117. if originalMasterId == "" {
  118. t.Errorf("no master")
  119. return
  120. }
  121. time.Sleep(clusters[0].masterLockExpiredTime + time.Second)
  122. hasMaster := false
  123. for _, cluster := range clusters {
  124. if cluster.id == originalMasterId {
  125. continue
  126. }
  127. _, err := cache.GetMapField[node](CLUSTER_STATUS_HASH_MAP_KEY, cluster.id)
  128. if err != nil {
  129. t.Errorf("get cluster status failed: %v", err)
  130. return
  131. }
  132. if cluster.IsMaster() {
  133. if hasMaster {
  134. t.Errorf("multiple substitute master")
  135. return
  136. } else {
  137. hasMaster = true
  138. }
  139. }
  140. }
  141. if !hasMaster {
  142. t.Errorf("no substitute master")
  143. }
  144. }
  145. func TestClusterAutoGCNoLongerActiveNode(t *testing.T) {
  146. clusters, err := createSimulationCluster(3)
  147. if err != nil {
  148. t.Errorf("create simulation cluster failed: %v", err)
  149. return
  150. }
  151. launchSimulationCluster(clusters)
  152. defer closeSimulationCluster(clusters, t)
  153. select {
  154. case <-clusters[0].NotifyBecomeMaster():
  155. case <-clusters[1].NotifyBecomeMaster():
  156. case <-clusters[2].NotifyBecomeMaster():
  157. }
  158. // randomly close a slave node to close
  159. slaveNodeId := ""
  160. for _, cluster := range clusters {
  161. if !cluster.IsMaster() {
  162. slaveNodeId = cluster.id
  163. cluster.Close()
  164. // wait for the cluster to close
  165. <-cluster.NotifyClusterStopped()
  166. // recover the node status
  167. if err := cluster.updateNodeStatus(); err != nil {
  168. t.Errorf("failed to recover the node status: %v", err)
  169. return
  170. }
  171. break
  172. }
  173. }
  174. if slaveNodeId == "" {
  175. t.Errorf("no slave node")
  176. return
  177. }
  178. // wait for master gc task
  179. time.Sleep(clusters[0].nodeDisconnectedTimeout*2 + time.Second)
  180. _, err = cache.GetMapField[node](CLUSTER_STATUS_HASH_MAP_KEY, slaveNodeId)
  181. if err == nil {
  182. t.Errorf("slave node is not collected by master gc automatically")
  183. return
  184. }
  185. }