master_server.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439
  1. package weed_server
  2. import (
  3. "context"
  4. "fmt"
  5. "net/http"
  6. "net/http/httputil"
  7. "net/url"
  8. "os"
  9. "regexp"
  10. "runtime"
  11. "strings"
  12. "sync"
  13. "time"
  14. "github.com/seaweedfs/seaweedfs/weed/stats"
  15. "github.com/seaweedfs/seaweedfs/weed/telemetry"
  16. "github.com/seaweedfs/seaweedfs/weed/cluster"
  17. "github.com/seaweedfs/seaweedfs/weed/pb"
  18. "github.com/gorilla/mux"
  19. hashicorpRaft "github.com/hashicorp/raft"
  20. "github.com/seaweedfs/raft"
  21. "google.golang.org/grpc"
  22. "github.com/seaweedfs/seaweedfs/weed/glog"
  23. "github.com/seaweedfs/seaweedfs/weed/pb/master_pb"
  24. "github.com/seaweedfs/seaweedfs/weed/security"
  25. "github.com/seaweedfs/seaweedfs/weed/sequence"
  26. "github.com/seaweedfs/seaweedfs/weed/shell"
  27. "github.com/seaweedfs/seaweedfs/weed/topology"
  28. "github.com/seaweedfs/seaweedfs/weed/util"
  29. util_http "github.com/seaweedfs/seaweedfs/weed/util/http"
  30. "github.com/seaweedfs/seaweedfs/weed/util/version"
  31. "github.com/seaweedfs/seaweedfs/weed/wdclient"
  32. )
// Configuration keys looked up through viper when the master creates its
// file id sequencer (see createSequencer).
const (
	// SequencerType is the configuration key naming the sequencer
	// implementation to use.
	SequencerType = "master.sequencer.type"
	// SequencerSnowflakeId is the configuration key holding the integer id
	// passed to the snowflake sequencer.
	SequencerSnowflakeId = "master.sequencer.sequencer_snowflake_id"
)
// MasterOption carries the settings a MasterServer is constructed with.
type MasterOption struct {
	// Master is this master's own address; it is handed to the master client,
	// the snowflake sequencer and the maintenance shell.
	Master pb.ServerAddress
	// MetaFolder is not read in this file.
	// NOTE(review): presumably the directory holding master metadata — confirm with callers.
	MetaFolder string
	// VolumeSizeLimitMB is the volume size limit in megabytes; it is converted
	// to bytes for the topology and for preallocation.
	VolumeSizeLimitMB uint32
	// VolumePreallocate, when true, makes the preallocation size equal to the
	// full volume size limit; otherwise the preallocation size stays zero.
	VolumePreallocate bool
	// MaxParallelVacuumPerServer is forwarded to the topology's
	// StartRefreshWritableVolumes.
	MaxParallelVacuumPerServer int
	// PulseSeconds int
	// DefaultReplicaPlacement is not read in this file.
	// NOTE(review): presumably the replication setting applied when a request names none — confirm.
	DefaultReplicaPlacement string
	// GarbageThreshold is forwarded to the topology's
	// StartRefreshWritableVolumes.
	GarbageThreshold float64
	// WhiteList is combined with the "guard.white_list" configuration entries
	// to form the guard's white list.
	WhiteList []string
	// DisableHttp, when true, skips registration of the HTTP API routes
	// (/dir/*, /col/*, /vol/*, /submit, /collection/info and /{fileId}).
	DisableHttp bool
	// MetricsAddress is not read in this file.
	MetricsAddress string
	// MetricsIntervalSec is not read in this file.
	MetricsIntervalSec int
	// IsFollower, when true, prevents the maintenance admin scripts from
	// being started.
	IsFollower bool
	// TelemetryUrl is the URL given to the telemetry client; telemetry is only
	// set up when it is non-empty and TelemetryEnabled is true.
	TelemetryUrl string
	// TelemetryEnabled turns telemetry collection on (together with a
	// non-empty TelemetryUrl).
	TelemetryEnabled bool
	// VolumeGrowthDisabled is overwritten by NewMasterServer with the value of
	// the "master.volume_growth.disable" configuration entry.
	VolumeGrowthDisabled bool
}
// MasterServer holds the state of a master node: its options, topology,
// security guard, connected-client channels and raft/cluster helpers.
type MasterServer struct {
	// Embedded so the type satisfies the generated gRPC server interface even
	// for RPCs it does not implement itself.
	master_pb.UnimplementedSeaweedServer
	// option is the option set passed to NewMasterServer.
	option *MasterOption
	// guard enforces the white list and holds the JWT signing settings.
	guard *security.Guard
	// preallocateSize is the volume size limit in bytes when preallocation is
	// enabled, and zero otherwise.
	preallocateSize int64
	// Topo is the cluster topology; it also carries the raft server handles.
	Topo *topology.Topology
	// vg is the volume growth helper created by topology.NewDefaultVolumeGrowth.
	vg *topology.VolumeGrowth
	// volumeGrowthRequestChan is a buffered channel (capacity 64) of volume
	// grow requests.
	volumeGrowthRequestChan chan *topology.VolumeGrowRequest
	// notifying clients
	// NOTE(review): clientChansLock presumably guards clientChans — confirm at the use sites.
	clientChansLock sync.RWMutex
	// clientChans maps a string key to the channel on which
	// KeepConnectedResponse messages are delivered.
	clientChans map[string]chan *master_pb.KeepConnectedResponse
	// grpcDialOption is the client TLS dial option loaded for "grpc.master".
	grpcDialOption grpc.DialOption
	// MasterClient is this master's client to the master peers.
	MasterClient *wdclient.MasterClient
	// adminLocks is created by NewAdminLocks.
	adminLocks *AdminLocks
	// Cluster is created by cluster.NewCluster.
	Cluster *cluster.Cluster
	// telemetry
	// telemetryCollector stays nil unless telemetry is enabled with a URL.
	telemetryCollector *telemetry.Collector
}
// NewMasterServer builds a MasterServer from option and the viper
// configuration, registers its HTTP handlers on r, and starts its background
// work (writable-volume refresh, grow-request processing and, unless
// option.IsFollower is set, the maintenance admin scripts).
//
// peers is the set of master peers used for the internal master client.
//
// Side effects visible here: option.VolumeGrowthDisabled and the package-level
// topology.VolumeGrowStrategy are overwritten from configuration, and the
// process is terminated via glog.Fatalf if no sequencer can be created.
func NewMasterServer(r *mux.Router, option *MasterOption, peers map[string]pb.ServerAddress) *MasterServer {
	v := util.GetViper()
	// JWT settings: write tokens default to 10s expiry, read tokens to 60s.
	signingKey := v.GetString("jwt.signing.key")
	v.SetDefault("jwt.signing.expires_after_seconds", 10)
	expiresAfterSec := v.GetInt("jwt.signing.expires_after_seconds")
	readSigningKey := v.GetString("jwt.signing.read.key")
	v.SetDefault("jwt.signing.read.expires_after_seconds", 60)
	readExpiresAfterSec := v.GetInt("jwt.signing.read.expires_after_seconds")
	v.SetDefault("master.replication.treat_replication_as_minimums", false)
	replicationAsMin := v.GetBool("master.replication.treat_replication_as_minimums")
	// Seed the volume growth defaults from the current strategy values, then
	// write the (possibly overridden) configuration back into the strategy.
	v.SetDefault("master.volume_growth.copy_1", topology.VolumeGrowStrategy.Copy1Count)
	v.SetDefault("master.volume_growth.copy_2", topology.VolumeGrowStrategy.Copy2Count)
	v.SetDefault("master.volume_growth.copy_3", topology.VolumeGrowStrategy.Copy3Count)
	v.SetDefault("master.volume_growth.copy_other", topology.VolumeGrowStrategy.CopyOtherCount)
	v.SetDefault("master.volume_growth.threshold", topology.VolumeGrowStrategy.Threshold)
	v.SetDefault("master.volume_growth.disable", false)
	// The configuration value replaces whatever the caller put in the option.
	option.VolumeGrowthDisabled = v.GetBool("master.volume_growth.disable")
	topology.VolumeGrowStrategy.Copy1Count = v.GetUint32("master.volume_growth.copy_1")
	topology.VolumeGrowStrategy.Copy2Count = v.GetUint32("master.volume_growth.copy_2")
	topology.VolumeGrowStrategy.Copy3Count = v.GetUint32("master.volume_growth.copy_3")
	topology.VolumeGrowStrategy.CopyOtherCount = v.GetUint32("master.volume_growth.copy_other")
	topology.VolumeGrowStrategy.Threshold = v.GetFloat64("master.volume_growth.threshold")
	whiteList := util.StringSplit(v.GetString("guard.white_list"), ",")
	// Preallocate the full volume size (MB converted to bytes) only when asked to.
	var preallocateSize int64
	if option.VolumePreallocate {
		preallocateSize = int64(option.VolumeSizeLimitMB) * (1 << 20)
	}
	grpcDialOption := security.LoadClientTLS(v, "grpc.master")
	ms := &MasterServer{
		option:                  option,
		preallocateSize:         preallocateSize,
		volumeGrowthRequestChan: make(chan *topology.VolumeGrowRequest, 1<<6),
		clientChans:             make(map[string]chan *master_pb.KeepConnectedResponse),
		grpcDialOption:          grpcDialOption,
		MasterClient:            wdclient.NewMasterClient(grpcDialOption, "", cluster.MasterType, option.Master, "", "", *pb.NewServiceDiscoveryFromMap(peers)),
		adminLocks:              NewAdminLocks(),
		Cluster:                 cluster.NewCluster(),
	}
	ms.MasterClient.SetOnPeerUpdateFn(ms.OnPeerUpdate)
	// createSequencer returns nil when the snowflake sequencer cannot be built;
	// the master cannot run without a sequencer.
	seq := ms.createSequencer(option)
	if nil == seq {
		glog.Fatalf("create sequencer failed.")
	}
	// NOTE(review): the literal 5 is presumably the pulse interval in seconds
	// (cf. the commented-out PulseSeconds option) — confirm against topology.NewTopology.
	ms.Topo = topology.NewTopology("topo", seq, uint64(ms.option.VolumeSizeLimitMB)*1024*1024, 5, replicationAsMin)
	ms.vg = topology.NewDefaultVolumeGrowth()
	glog.V(0).Infoln("Volume Size Limit is", ms.option.VolumeSizeLimitMB, "MB")
	// Initialize telemetry after topology is created
	if option.TelemetryEnabled && option.TelemetryUrl != "" {
		telemetryClient := telemetry.NewClient(option.TelemetryUrl, option.TelemetryEnabled)
		ms.telemetryCollector = telemetry.NewCollector(telemetryClient, ms.Topo, ms.Cluster)
		ms.telemetryCollector.SetMasterServer(ms)
		// Set version and OS information
		ms.telemetryCollector.SetVersion(version.VERSION_NUMBER)
		ms.telemetryCollector.SetOS(runtime.GOOS + "/" + runtime.GOARCH)
		// Start periodic telemetry collection (every 24 hours)
		ms.telemetryCollector.StartPeriodicCollection(24 * time.Hour)
	}
	// The guard's white list is the option's list followed by the configured one.
	ms.guard = security.NewGuard(append(ms.option.WhiteList, whiteList...), signingKey, expiresAfterSec, readSigningKey, readExpiresAfterSec)
	// Routes. Handlers wrapped in proxyToLeader are forwarded to the raft
	// leader when this node is not the leader.
	handleStaticResources2(r)
	r.HandleFunc("/", ms.proxyToLeader(requestIDMiddleware(ms.uiStatusHandler)))
	r.HandleFunc("/ui/index.html", requestIDMiddleware(ms.uiStatusHandler))
	if !ms.option.DisableHttp {
		r.HandleFunc("/dir/assign", ms.proxyToLeader(ms.guard.WhiteList(requestIDMiddleware(ms.dirAssignHandler))))
		r.HandleFunc("/dir/lookup", ms.guard.WhiteList(requestIDMiddleware(ms.dirLookupHandler)))
		r.HandleFunc("/dir/status", ms.proxyToLeader(ms.guard.WhiteList(requestIDMiddleware(ms.dirStatusHandler))))
		r.HandleFunc("/col/delete", ms.proxyToLeader(ms.guard.WhiteList(requestIDMiddleware(ms.collectionDeleteHandler))))
		r.HandleFunc("/vol/grow", ms.proxyToLeader(ms.guard.WhiteList(requestIDMiddleware(ms.volumeGrowHandler))))
		r.HandleFunc("/vol/status", ms.proxyToLeader(ms.guard.WhiteList(requestIDMiddleware(ms.volumeStatusHandler))))
		r.HandleFunc("/vol/vacuum", ms.proxyToLeader(ms.guard.WhiteList(requestIDMiddleware(ms.volumeVacuumHandler))))
		r.HandleFunc("/submit", ms.guard.WhiteList(requestIDMiddleware(ms.submitFromMasterServerHandler)))
		r.HandleFunc("/collection/info", ms.guard.WhiteList(requestIDMiddleware(ms.collectionInfoHandler)))
		/*
			r.HandleFunc("/stats/health", ms.guard.WhiteList(statsHealthHandler))
			r.HandleFunc("/stats/counter", ms.guard.WhiteList(statsCounterHandler))
			r.HandleFunc("/stats/memory", ms.guard.WhiteList(statsMemoryHandler))
		*/
		// Catch-all single-segment route; registered after the specific paths above.
		r.HandleFunc("/{fileId}", requestIDMiddleware(ms.redirectHandler))
	}
	ms.Topo.StartRefreshWritableVolumes(
		ms.grpcDialOption,
		ms.option.GarbageThreshold,
		ms.option.MaxParallelVacuumPerServer,
		topology.VolumeGrowStrategy.Threshold,
		ms.preallocateSize,
	)
	ms.ProcessGrowRequest()
	// Followers do not run the maintenance scripts.
	if !option.IsFollower {
		ms.startAdminScripts()
	}
	return ms
}
  164. func (ms *MasterServer) SetRaftServer(raftServer *RaftServer) {
  165. var raftServerName string
  166. ms.Topo.RaftServerAccessLock.Lock()
  167. if raftServer.raftServer != nil {
  168. ms.Topo.RaftServer = raftServer.raftServer
  169. ms.Topo.RaftServer.AddEventListener(raft.LeaderChangeEventType, func(e raft.Event) {
  170. glog.V(0).Infof("leader change event: %+v => %+v", e.PrevValue(), e.Value())
  171. stats.MasterLeaderChangeCounter.WithLabelValues(fmt.Sprintf("%+v", e.Value())).Inc()
  172. if ms.Topo.RaftServer.Leader() != "" {
  173. glog.V(0).Infof("[%s] %s becomes leader.", ms.Topo.RaftServer.Name(), ms.Topo.RaftServer.Leader())
  174. ms.Topo.LastLeaderChangeTime = time.Now()
  175. }
  176. })
  177. raftServerName = fmt.Sprintf("[%s]", ms.Topo.RaftServer.Name())
  178. } else if raftServer.RaftHashicorp != nil {
  179. ms.Topo.HashicorpRaft = raftServer.RaftHashicorp
  180. raftServerName = ms.Topo.HashicorpRaft.String()
  181. ms.Topo.LastLeaderChangeTime = time.Now()
  182. }
  183. ms.Topo.RaftServerAccessLock.Unlock()
  184. if ms.Topo.IsLeader() {
  185. glog.V(0).Infof("%s I am the leader!", raftServerName)
  186. } else {
  187. var raftServerLeader string
  188. ms.Topo.RaftServerAccessLock.RLock()
  189. if ms.Topo.RaftServer != nil {
  190. raftServerLeader = ms.Topo.RaftServer.Leader()
  191. } else if ms.Topo.HashicorpRaft != nil {
  192. raftServerName = ms.Topo.HashicorpRaft.String()
  193. raftServerLeaderAddr, _ := ms.Topo.HashicorpRaft.LeaderWithID()
  194. raftServerLeader = string(raftServerLeaderAddr)
  195. }
  196. ms.Topo.RaftServerAccessLock.RUnlock()
  197. glog.V(0).Infof("%s %s - is the leader.", raftServerName, raftServerLeader)
  198. }
  199. }
  200. func (ms *MasterServer) proxyToLeader(f http.HandlerFunc) http.HandlerFunc {
  201. return func(w http.ResponseWriter, r *http.Request) {
  202. if ms.Topo.IsLeader() {
  203. f(w, r)
  204. return
  205. }
  206. // get the current raft leader
  207. leaderAddr, _ := ms.Topo.MaybeLeader()
  208. raftServerLeader := leaderAddr.ToHttpAddress()
  209. if raftServerLeader == "" {
  210. f(w, r)
  211. return
  212. }
  213. // determine the scheme based on HTTPS client configuration
  214. scheme := util_http.GetGlobalHttpClient().GetHttpScheme()
  215. targetUrl, err := url.Parse(scheme + "://" + raftServerLeader)
  216. if err != nil {
  217. writeJsonError(w, r, http.StatusInternalServerError,
  218. fmt.Errorf("Leader URL %s://%s Parse Error: %v", scheme, raftServerLeader, err))
  219. return
  220. }
  221. // proxy to leader
  222. glog.V(4).Infoln("proxying to leader", raftServerLeader, "using", scheme)
  223. proxy := httputil.NewSingleHostReverseProxy(targetUrl)
  224. proxy.Transport = util_http.GetGlobalHttpClient().GetClientTransport()
  225. proxy.ServeHTTP(w, r)
  226. }
  227. }
  228. func (ms *MasterServer) startAdminScripts() {
  229. v := util.GetViper()
  230. adminScripts := v.GetString("master.maintenance.scripts")
  231. if adminScripts == "" {
  232. return
  233. }
  234. glog.V(0).Infof("adminScripts: %v", adminScripts)
  235. v.SetDefault("master.maintenance.sleep_minutes", 17)
  236. sleepMinutes := v.GetFloat64("master.maintenance.sleep_minutes")
  237. scriptLines := strings.Split(adminScripts, "\n")
  238. if !strings.Contains(adminScripts, "lock") {
  239. scriptLines = append(append([]string{}, "lock"), scriptLines...)
  240. scriptLines = append(scriptLines, "unlock")
  241. }
  242. masterAddress := string(ms.option.Master)
  243. var shellOptions shell.ShellOptions
  244. shellOptions.GrpcDialOption = security.LoadClientTLS(v, "grpc.master")
  245. shellOptions.Masters = &masterAddress
  246. shellOptions.Directory = "/"
  247. emptyFilerGroup := ""
  248. shellOptions.FilerGroup = &emptyFilerGroup
  249. commandEnv := shell.NewCommandEnv(&shellOptions)
  250. reg, _ := regexp.Compile(`'.*?'|".*?"|\S+`)
  251. go commandEnv.MasterClient.KeepConnectedToMaster(context.Background())
  252. go func() {
  253. for {
  254. time.Sleep(time.Duration(sleepMinutes) * time.Minute)
  255. if ms.Topo.IsLeader() && ms.MasterClient.GetMaster(context.Background()) != "" {
  256. shellOptions.FilerAddress = ms.GetOneFiler(cluster.FilerGroupName(*shellOptions.FilerGroup))
  257. if shellOptions.FilerAddress == "" {
  258. continue
  259. }
  260. for _, line := range scriptLines {
  261. for _, c := range strings.Split(line, ";") {
  262. processEachCmd(reg, c, commandEnv)
  263. }
  264. }
  265. }
  266. }
  267. }()
  268. }
  269. func processEachCmd(reg *regexp.Regexp, line string, commandEnv *shell.CommandEnv) {
  270. cmds := reg.FindAllString(line, -1)
  271. if len(cmds) == 0 {
  272. return
  273. }
  274. args := make([]string, len(cmds[1:]))
  275. for i := range args {
  276. args[i] = strings.Trim(string(cmds[1+i]), "\"'")
  277. }
  278. cmd := cmds[0]
  279. for _, c := range shell.Commands {
  280. if c.Name() == cmd {
  281. if c.HasTag(shell.ResourceHeavy) {
  282. glog.Warningf("%s is resource heavy and should not run on master", cmd)
  283. continue
  284. }
  285. glog.V(0).Infof("executing: %s %v", cmd, args)
  286. if err := c.Do(args, commandEnv, os.Stdout); err != nil {
  287. glog.V(0).Infof("error: %v", err)
  288. }
  289. }
  290. }
  291. }
  292. func (ms *MasterServer) createSequencer(option *MasterOption) sequence.Sequencer {
  293. var seq sequence.Sequencer
  294. v := util.GetViper()
  295. seqType := strings.ToLower(v.GetString(SequencerType))
  296. glog.V(1).Infof("[%s] : [%s]", SequencerType, seqType)
  297. switch strings.ToLower(seqType) {
  298. case "snowflake":
  299. var err error
  300. snowflakeId := v.GetInt(SequencerSnowflakeId)
  301. seq, err = sequence.NewSnowflakeSequencer(string(option.Master), snowflakeId)
  302. if err != nil {
  303. glog.Error(err)
  304. seq = nil
  305. }
  306. case "raft":
  307. fallthrough
  308. default:
  309. seq = sequence.NewMemorySequencer()
  310. }
  311. return seq
  312. }
  313. func (ms *MasterServer) OnPeerUpdate(update *master_pb.ClusterNodeUpdate, startFrom time.Time) {
  314. ms.Topo.RaftServerAccessLock.RLock()
  315. defer ms.Topo.RaftServerAccessLock.RUnlock()
  316. if update.NodeType != cluster.MasterType || ms.Topo.HashicorpRaft == nil {
  317. return
  318. }
  319. glog.V(4).Infof("OnPeerUpdate: %+v", update)
  320. peerAddress := pb.ServerAddress(update.Address)
  321. peerName := string(peerAddress)
  322. if ms.Topo.HashicorpRaft.State() != hashicorpRaft.Leader {
  323. return
  324. }
  325. if update.IsAdd {
  326. raftServerFound := false
  327. for _, server := range ms.Topo.HashicorpRaft.GetConfiguration().Configuration().Servers {
  328. if string(server.ID) == peerName {
  329. raftServerFound = true
  330. }
  331. }
  332. if !raftServerFound {
  333. glog.V(0).Infof("adding new raft server: %s", peerName)
  334. ms.Topo.HashicorpRaft.AddVoter(
  335. hashicorpRaft.ServerID(peerName),
  336. hashicorpRaft.ServerAddress(peerAddress.ToGrpcAddress()), 0, 0)
  337. }
  338. } else {
  339. pb.WithMasterClient(false, peerAddress, ms.grpcDialOption, true, func(client master_pb.SeaweedClient) error {
  340. ctx, cancel := context.WithTimeout(context.TODO(), 15*time.Second)
  341. defer cancel()
  342. if _, err := client.Ping(ctx, &master_pb.PingRequest{Target: string(peerAddress), TargetType: cluster.MasterType}); err != nil {
  343. glog.V(0).Infof("master %s didn't respond to pings. remove raft server", peerName)
  344. if err := ms.MasterClient.WithClient(false, func(client master_pb.SeaweedClient) error {
  345. _, err := client.RaftRemoveServer(context.Background(), &master_pb.RaftRemoveServerRequest{
  346. Id: peerName,
  347. Force: false,
  348. })
  349. return err
  350. }); err != nil {
  351. glog.Warningf("failed removing old raft server: %v", err)
  352. return err
  353. }
  354. } else {
  355. glog.V(0).Infof("master %s successfully responded to ping", peerName)
  356. }
  357. return nil
  358. })
  359. }
  360. }
  361. func (ms *MasterServer) Shutdown() {
  362. if ms.Topo == nil || ms.Topo.HashicorpRaft == nil {
  363. return
  364. }
  365. if ms.Topo.HashicorpRaft.State() == hashicorpRaft.Leader {
  366. ms.Topo.HashicorpRaft.LeadershipTransfer()
  367. }
  368. ms.Topo.HashicorpRaft.Shutdown()
  369. }
  370. func (ms *MasterServer) Reload() {
  371. glog.V(0).Infoln("Reload master server...")
  372. util.LoadConfiguration("security", false)
  373. v := util.GetViper()
  374. ms.guard.UpdateWhiteList(append(ms.option.WhiteList,
  375. util.StringSplit(v.GetString("guard.white_list"), ",")...),
  376. )
  377. }